xref: /petsc/src/ksp/pc/impls/bddc/bddcprivate.c (revision c964aadf5f296a8909ebf687d295bed23b4925d3)
11cf9b237SStefano Zampini #include <../src/mat/impls/aij/seq/aij.h>
2ab5c6b0cSJed Brown #include <../src/ksp/pc/impls/bddc/bddc.h>
3ab5c6b0cSJed Brown #include <../src/ksp/pc/impls/bddc/bddcprivate.h>
4c80a6c00SStefano Zampini #include <petscdmplex.h>
5674ae819SStefano Zampini #include <petscblaslapack.h>
6daf8a457SStefano Zampini #include <petsc/private/sfimpl.h>
7c80a6c00SStefano Zampini #include <petsc/private/dmpleximpl.h>
8674ae819SStefano Zampini 
91e0482f5SStefano Zampini static PetscErrorCode MatMPIAIJRestrict(Mat,MPI_Comm,Mat*);
101e0482f5SStefano Zampini 
11f498cd09SStefano Zampini /* if range is true,  it returns B s.t. span{B} = range(A)
12f498cd09SStefano Zampini    if range is false, it returns B s.t. range(B) _|_ range(A) */
13f498cd09SStefano Zampini PetscErrorCode MatDenseOrthogonalRangeOrComplement(Mat A, PetscBool range, PetscInt lw, PetscScalar *work, PetscReal *rwork, Mat *B)
14a13144ffSStefano Zampini {
15a13144ffSStefano Zampini #if !defined(PETSC_USE_COMPLEX)
16a13144ffSStefano Zampini   PetscScalar    *uwork,*data,*U, ds = 0.;
17a13144ffSStefano Zampini   PetscReal      *sing;
18a13144ffSStefano Zampini   PetscBLASInt   bM,bN,lwork,lierr,di = 1;
19a13144ffSStefano Zampini   PetscInt       ulw,i,nr,nc,n;
20a13144ffSStefano Zampini   PetscErrorCode ierr;
21a13144ffSStefano Zampini 
22a13144ffSStefano Zampini   PetscFunctionBegin;
23a13144ffSStefano Zampini #if defined(PETSC_MISSING_LAPACK_GESVD)
24a13144ffSStefano Zampini   SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"LAPACK _GESVD not available");
25614dbb09SStefano Zampini #else
26a13144ffSStefano Zampini   ierr = MatGetSize(A,&nr,&nc);CHKERRQ(ierr);
27a13144ffSStefano Zampini   if (!nr || !nc) PetscFunctionReturn(0);
28a13144ffSStefano Zampini 
29a13144ffSStefano Zampini   /* workspace */
30a13144ffSStefano Zampini   if (!work) {
31a13144ffSStefano Zampini     ulw  = PetscMax(PetscMax(1,5*PetscMin(nr,nc)),3*PetscMin(nr,nc)+PetscMax(nr,nc));
32f913dca9SStefano Zampini     ierr = PetscMalloc1(ulw,&uwork);CHKERRQ(ierr);
33a13144ffSStefano Zampini   } else {
34a13144ffSStefano Zampini     ulw   = lw;
35a13144ffSStefano Zampini     uwork = work;
36a13144ffSStefano Zampini   }
37a13144ffSStefano Zampini   n = PetscMin(nr,nc);
38a13144ffSStefano Zampini   if (!rwork) {
39a13144ffSStefano Zampini     ierr = PetscMalloc1(n,&sing);CHKERRQ(ierr);
40a13144ffSStefano Zampini   } else {
41a13144ffSStefano Zampini     sing = rwork;
42a13144ffSStefano Zampini   }
43a13144ffSStefano Zampini 
44a13144ffSStefano Zampini   /* SVD */
45a13144ffSStefano Zampini   ierr = PetscMalloc1(nr*nr,&U);CHKERRQ(ierr);
46a13144ffSStefano Zampini   ierr = PetscBLASIntCast(nr,&bM);CHKERRQ(ierr);
47a13144ffSStefano Zampini   ierr = PetscBLASIntCast(nc,&bN);CHKERRQ(ierr);
48a13144ffSStefano Zampini   ierr = PetscBLASIntCast(ulw,&lwork);CHKERRQ(ierr);
49a13144ffSStefano Zampini   ierr = MatDenseGetArray(A,&data);CHKERRQ(ierr);
50a13144ffSStefano Zampini   ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr);
51a13144ffSStefano Zampini   PetscStackCallBLAS("LAPACKgesvd",LAPACKgesvd_("A","N",&bM,&bN,data,&bM,sing,U,&bM,&ds,&di,uwork,&lwork,&lierr));
52a13144ffSStefano Zampini   ierr = PetscFPTrapPop();CHKERRQ(ierr);
53a13144ffSStefano Zampini   if (lierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in GESVD Lapack routine %d",(int)lierr);
54a13144ffSStefano Zampini   ierr = MatDenseRestoreArray(A,&data);CHKERRQ(ierr);
55a13144ffSStefano Zampini   for (i=0;i<n;i++) if (sing[i] < PETSC_SMALL) break;
56a13144ffSStefano Zampini   if (!rwork) {
57a13144ffSStefano Zampini     ierr = PetscFree(sing);CHKERRQ(ierr);
58a13144ffSStefano Zampini   }
59a13144ffSStefano Zampini   if (!work) {
60a13144ffSStefano Zampini     ierr = PetscFree(uwork);CHKERRQ(ierr);
61a13144ffSStefano Zampini   }
62a13144ffSStefano Zampini   /* create B */
63f498cd09SStefano Zampini   if (!range) {
64a13144ffSStefano Zampini     ierr = MatCreateSeqDense(PETSC_COMM_SELF,nr,nr-i,NULL,B);CHKERRQ(ierr);
65a13144ffSStefano Zampini     ierr = MatDenseGetArray(*B,&data);CHKERRQ(ierr);
66a13144ffSStefano Zampini     ierr = PetscMemcpy(data,U+nr*i,(nr-i)*nr*sizeof(PetscScalar));CHKERRQ(ierr);
67f498cd09SStefano Zampini   } else {
68f498cd09SStefano Zampini     ierr = MatCreateSeqDense(PETSC_COMM_SELF,nr,i,NULL,B);CHKERRQ(ierr);
69f498cd09SStefano Zampini     ierr = MatDenseGetArray(*B,&data);CHKERRQ(ierr);
70f498cd09SStefano Zampini     ierr = PetscMemcpy(data,U,i*nr*sizeof(PetscScalar));CHKERRQ(ierr);
71f498cd09SStefano Zampini   }
72a13144ffSStefano Zampini   ierr = MatDenseRestoreArray(*B,&data);CHKERRQ(ierr);
73a13144ffSStefano Zampini   ierr = PetscFree(U);CHKERRQ(ierr);
74614dbb09SStefano Zampini #endif
75614dbb09SStefano Zampini #else /* PETSC_USE_COMPLEX */
76a13144ffSStefano Zampini   PetscFunctionBegin;
77a13144ffSStefano Zampini   SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"Not implemented for complexes");
78a13144ffSStefano Zampini #endif
79a13144ffSStefano Zampini   PetscFunctionReturn(0);
80a13144ffSStefano Zampini }
81a13144ffSStefano Zampini 
821e0482f5SStefano Zampini /* TODO REMOVE */
831e0482f5SStefano Zampini #if defined(PRINT_GDET)
841e0482f5SStefano Zampini static int inc = 0;
851e0482f5SStefano Zampini static int lev = 0;
861e0482f5SStefano Zampini #endif
871e0482f5SStefano Zampini 
881e0482f5SStefano Zampini PetscErrorCode PCBDDCComputeNedelecChangeEdge(Mat lG, IS edge, IS extrow, IS extcol, IS corners, Mat* Gins, Mat* GKins, PetscScalar cvals[2], PetscScalar *work, PetscReal *rwork)
89a13144ffSStefano Zampini {
90a13144ffSStefano Zampini   PetscErrorCode ierr;
91a13144ffSStefano Zampini   Mat            GE,GEd;
92a13144ffSStefano Zampini   PetscInt       rsize,csize,esize;
93a13144ffSStefano Zampini   PetscScalar    *ptr;
94a13144ffSStefano Zampini 
95a13144ffSStefano Zampini   PetscFunctionBegin;
96a13144ffSStefano Zampini   ierr = ISGetSize(edge,&esize);CHKERRQ(ierr);
97c3c0e390SStefano Zampini   if (!esize) PetscFunctionReturn(0);
98a13144ffSStefano Zampini   ierr = ISGetSize(extrow,&rsize);CHKERRQ(ierr);
99a13144ffSStefano Zampini   ierr = ISGetSize(extcol,&csize);CHKERRQ(ierr);
100a13144ffSStefano Zampini 
101a13144ffSStefano Zampini   /* gradients */
102a13144ffSStefano Zampini   ptr  = work + 5*esize;
1037dae84e0SHong Zhang   ierr = MatCreateSubMatrix(lG,extrow,extcol,MAT_INITIAL_MATRIX,&GE);CHKERRQ(ierr);
104a13144ffSStefano Zampini   ierr = MatCreateSeqDense(PETSC_COMM_SELF,rsize,csize,ptr,Gins);CHKERRQ(ierr);
105a13144ffSStefano Zampini   ierr = MatConvert(GE,MATSEQDENSE,MAT_REUSE_MATRIX,Gins);CHKERRQ(ierr);
106a13144ffSStefano Zampini   ierr = MatDestroy(&GE);CHKERRQ(ierr);
107a13144ffSStefano Zampini 
108a13144ffSStefano Zampini   /* constants */
109a13144ffSStefano Zampini   ptr += rsize*csize;
110a13144ffSStefano Zampini   ierr = MatCreateSeqDense(PETSC_COMM_SELF,esize,csize,ptr,&GEd);CHKERRQ(ierr);
1117dae84e0SHong Zhang   ierr = MatCreateSubMatrix(lG,edge,extcol,MAT_INITIAL_MATRIX,&GE);CHKERRQ(ierr);
112a13144ffSStefano Zampini   ierr = MatConvert(GE,MATSEQDENSE,MAT_REUSE_MATRIX,&GEd);CHKERRQ(ierr);
113a13144ffSStefano Zampini   ierr = MatDestroy(&GE);CHKERRQ(ierr);
114f498cd09SStefano Zampini   ierr = MatDenseOrthogonalRangeOrComplement(GEd,PETSC_FALSE,5*esize,work,rwork,GKins);CHKERRQ(ierr);
115a13144ffSStefano Zampini   ierr = MatDestroy(&GEd);CHKERRQ(ierr);
1161e0482f5SStefano Zampini 
1171e0482f5SStefano Zampini   if (corners) {
1181e0482f5SStefano Zampini     Mat            GEc;
1191e0482f5SStefano Zampini     PetscScalar    *vals,v;
1201e0482f5SStefano Zampini 
1217dae84e0SHong Zhang     ierr = MatCreateSubMatrix(lG,edge,corners,MAT_INITIAL_MATRIX,&GEc);CHKERRQ(ierr);
1221e0482f5SStefano Zampini     ierr = MatTransposeMatMult(GEc,*GKins,MAT_INITIAL_MATRIX,1.0,&GEd);CHKERRQ(ierr);
1231e0482f5SStefano Zampini     ierr = MatDenseGetArray(GEd,&vals);CHKERRQ(ierr);
124637e8532SStefano Zampini     /* v    = PetscAbsScalar(vals[0]) */;
125637e8532SStefano Zampini     v    = 1.;
1261e0482f5SStefano Zampini     cvals[0] = vals[0]/v;
1271e0482f5SStefano Zampini     cvals[1] = vals[1]/v;
1281e0482f5SStefano Zampini     ierr = MatDenseRestoreArray(GEd,&vals);CHKERRQ(ierr);
1291e0482f5SStefano Zampini     ierr = MatScale(*GKins,1./v);CHKERRQ(ierr);
1301e0482f5SStefano Zampini #if defined(PRINT_GDET)
1311e0482f5SStefano Zampini     {
1321e0482f5SStefano Zampini       PetscViewer viewer;
1331e0482f5SStefano Zampini       char filename[256];
1341e0482f5SStefano Zampini       sprintf(filename,"Gdet_l%d_r%d_cc%d.m",lev,PetscGlobalRank,inc++);
1351e0482f5SStefano Zampini       ierr = PetscViewerASCIIOpen(PETSC_COMM_SELF,filename,&viewer);CHKERRQ(ierr);
1361e0482f5SStefano Zampini       ierr = PetscViewerPushFormat(viewer,PETSC_VIEWER_ASCII_MATLAB);CHKERRQ(ierr);
1371e0482f5SStefano Zampini       ierr = PetscObjectSetName((PetscObject)GEc,"GEc");CHKERRQ(ierr);
1381e0482f5SStefano Zampini       ierr = MatView(GEc,viewer);CHKERRQ(ierr);
1391e0482f5SStefano Zampini       ierr = PetscObjectSetName((PetscObject)(*GKins),"GK");CHKERRQ(ierr);
1401e0482f5SStefano Zampini       ierr = MatView(*GKins,viewer);CHKERRQ(ierr);
1411e0482f5SStefano Zampini       ierr = PetscObjectSetName((PetscObject)GEd,"Gproj");CHKERRQ(ierr);
1421e0482f5SStefano Zampini       ierr = MatView(GEd,viewer);CHKERRQ(ierr);
1431e0482f5SStefano Zampini       ierr = PetscViewerDestroy(&viewer);CHKERRQ(ierr);
1441e0482f5SStefano Zampini     }
1451e0482f5SStefano Zampini #endif
1461e0482f5SStefano Zampini     ierr = MatDestroy(&GEd);CHKERRQ(ierr);
1471e0482f5SStefano Zampini     ierr = MatDestroy(&GEc);CHKERRQ(ierr);
1481e0482f5SStefano Zampini   }
1491e0482f5SStefano Zampini 
150a13144ffSStefano Zampini   PetscFunctionReturn(0);
151a13144ffSStefano Zampini }
152a13144ffSStefano Zampini 
153a13144ffSStefano Zampini PetscErrorCode PCBDDCNedelecSupport(PC pc)
154a13144ffSStefano Zampini {
155a13144ffSStefano Zampini   PC_BDDC                *pcbddc = (PC_BDDC*)pc->data;
156a13144ffSStefano Zampini   Mat_IS                 *matis = (Mat_IS*)pc->pmat->data;
1570569b399SStefano Zampini   Mat                    G,T,conn,lG,lGt,lGis,lGall,lGe,lGinit;
158eee23b56SStefano Zampini   Vec                    tvec;
159a13144ffSStefano Zampini   PetscSF                sfv;
1601e0482f5SStefano Zampini   ISLocalToGlobalMapping el2g,vl2g,fl2g,al2g;
161a13144ffSStefano Zampini   MPI_Comm               comm;
162c2151214SStefano Zampini   IS                     lned,primals,allprimals,nedfieldlocal;
163c2151214SStefano Zampini   IS                     *eedges,*extrows,*extcols,*alleedges;
1647d871cd7SStefano Zampini   PetscBT                btv,bte,btvc,btb,btbd,btvcand,btvi,btee,bter;
165a13144ffSStefano Zampini   PetscScalar            *vals,*work;
166a13144ffSStefano Zampini   PetscReal              *rwork;
167a13144ffSStefano Zampini   const PetscInt         *idxs,*ii,*jj,*iit,*jjt;
1681e0482f5SStefano Zampini   PetscInt               ne,nv,Lv,order,n,field;
169a13144ffSStefano Zampini   PetscInt               n_neigh,*neigh,*n_shared,**shared;
170eee23b56SStefano Zampini   PetscInt               i,j,extmem,cum,maxsize,nee;
171b03ebc13SStefano Zampini   PetscInt               *extrow,*extrowcum,*marks,*vmarks,*gidxs;
172a13144ffSStefano Zampini   PetscInt               *sfvleaves,*sfvroots;
173b03ebc13SStefano Zampini   PetscInt               *corners,*cedges;
174637e8532SStefano Zampini   PetscInt               *ecount,**eneighs,*vcount,**vneighs;
175b03ebc13SStefano Zampini #if defined(PETSC_USE_DEBUG)
176b03ebc13SStefano Zampini   PetscInt               *emarks;
177b03ebc13SStefano Zampini #endif
178213b8bfaSStefano Zampini   PetscBool              print,eerr,done,lrc[2],conforming,global,singular,setprimal;
179a13144ffSStefano Zampini   PetscErrorCode         ierr;
180a13144ffSStefano Zampini 
181a13144ffSStefano Zampini   PetscFunctionBegin;
182213b8bfaSStefano Zampini   /* If the discrete gradient is defined for a subset of dofs and global is true,
183213b8bfaSStefano Zampini      it assumes G is given in global ordering for all the dofs.
184213b8bfaSStefano Zampini      Otherwise, the ordering is global for the Nedelec field */
185213b8bfaSStefano Zampini   order      = pcbddc->nedorder;
186213b8bfaSStefano Zampini   conforming = pcbddc->conforming;
187213b8bfaSStefano Zampini   field      = pcbddc->nedfield;
188213b8bfaSStefano Zampini   global     = pcbddc->nedglobal;
189213b8bfaSStefano Zampini   setprimal  = PETSC_FALSE;
190a13144ffSStefano Zampini   print      = PETSC_FALSE;
191213b8bfaSStefano Zampini   singular   = PETSC_FALSE;
192a13144ffSStefano Zampini 
193213b8bfaSStefano Zampini   /* Command line customization */
194213b8bfaSStefano Zampini   ierr = PetscOptionsBegin(PetscObjectComm((PetscObject)pc),((PetscObject)pc)->prefix,"BDDC Nedelec options","PC");CHKERRQ(ierr);
195213b8bfaSStefano Zampini   ierr = PetscOptionsBool("-pc_bddc_nedelec_field_primal","All edge dofs set as primals: Toselli's algorithm C",NULL,setprimal,&setprimal,NULL);CHKERRQ(ierr);
196213b8bfaSStefano Zampini   ierr = PetscOptionsBool("-pc_bddc_nedelec_singular","Infer nullspace from discrete gradient",NULL,singular,&singular,NULL);CHKERRQ(ierr);
197213b8bfaSStefano Zampini   ierr = PetscOptionsInt("-pc_bddc_nedelec_order","Test variable order code (to be removed)",NULL,order,&order,NULL);CHKERRQ(ierr);
198213b8bfaSStefano Zampini   /* print debug info TODO: to be removed */
199213b8bfaSStefano Zampini   ierr = PetscOptionsBool("-pc_bddc_nedelec_print","Print debug info",NULL,print,&print,NULL);CHKERRQ(ierr);
200213b8bfaSStefano Zampini   ierr = PetscOptionsEnd();CHKERRQ(ierr);
201213b8bfaSStefano Zampini 
202213b8bfaSStefano Zampini   /* Return if there are no edges in the decomposition and the problem is not singular */
2031e0482f5SStefano Zampini   ierr = MatGetLocalToGlobalMapping(pc->pmat,&al2g,NULL);CHKERRQ(ierr);
2041e0482f5SStefano Zampini   ierr = ISLocalToGlobalMappingGetSize(al2g,&n);CHKERRQ(ierr);
205213b8bfaSStefano Zampini   ierr = PetscObjectGetComm((PetscObject)pc,&comm);CHKERRQ(ierr);
206213b8bfaSStefano Zampini   if (!singular) {
207a13144ffSStefano Zampini     ierr   = VecGetArrayRead(matis->counter,(const PetscScalar**)&vals);CHKERRQ(ierr);
208a13144ffSStefano Zampini     lrc[0] = PETSC_FALSE;
209c2151214SStefano Zampini     for (i=0;i<n;i++) {
210a13144ffSStefano Zampini       if (PetscRealPart(vals[i]) > 2.) {
211a13144ffSStefano Zampini         lrc[0] = PETSC_TRUE;
212a13144ffSStefano Zampini         break;
213a13144ffSStefano Zampini       }
214a13144ffSStefano Zampini     }
215a13144ffSStefano Zampini     ierr = VecRestoreArrayRead(matis->counter,(const PetscScalar**)&vals);CHKERRQ(ierr);
216a13144ffSStefano Zampini     ierr = MPIU_Allreduce(&lrc[0],&lrc[1],1,MPIU_BOOL,MPI_LOR,comm);CHKERRQ(ierr);
217a13144ffSStefano Zampini     if (!lrc[1]) PetscFunctionReturn(0);
218213b8bfaSStefano Zampini   }
219a13144ffSStefano Zampini 
220213b8bfaSStefano Zampini   /* Get Nedelec field */
221213b8bfaSStefano Zampini   ierr = MatISSetUpSF(pc->pmat);CHKERRQ(ierr);
222c2151214SStefano Zampini   if (pcbddc->n_ISForDofsLocal && field >= pcbddc->n_ISForDofsLocal) SETERRQ2(comm,PETSC_ERR_USER,"Invalid field for Nedelec %d: number of fields is %d",field,pcbddc->n_ISForDofsLocal);
223213b8bfaSStefano Zampini   if (pcbddc->n_ISForDofsLocal && field >= 0) {
224c2151214SStefano Zampini     ierr          = PetscObjectReference((PetscObject)pcbddc->ISForDofsLocal[field]);CHKERRQ(ierr);
225c2151214SStefano Zampini     nedfieldlocal = pcbddc->ISForDofsLocal[field];
226c2151214SStefano Zampini     ierr          = ISGetLocalSize(nedfieldlocal,&ne);CHKERRQ(ierr);
227213b8bfaSStefano Zampini   } else if (!pcbddc->n_ISForDofsLocal && field != PETSC_DECIDE) {
228213b8bfaSStefano Zampini     ne            = n;
229213b8bfaSStefano Zampini     nedfieldlocal = NULL;
230213b8bfaSStefano Zampini     global        = PETSC_TRUE;
231213b8bfaSStefano Zampini   } else if (field == PETSC_DECIDE) {
232213b8bfaSStefano Zampini     PetscInt rst,ren,*idx;
233213b8bfaSStefano Zampini 
234213b8bfaSStefano Zampini     ierr = PetscMemzero(matis->sf_leafdata,n*sizeof(PetscInt));CHKERRQ(ierr);
235213b8bfaSStefano Zampini     ierr = PetscMemzero(matis->sf_rootdata,pc->pmat->rmap->n*sizeof(PetscInt));CHKERRQ(ierr);
236213b8bfaSStefano Zampini     ierr = MatGetOwnershipRange(pcbddc->discretegradient,&rst,&ren);CHKERRQ(ierr);
237213b8bfaSStefano Zampini     for (i=rst;i<ren;i++) {
238213b8bfaSStefano Zampini       PetscInt nc;
239213b8bfaSStefano Zampini 
240213b8bfaSStefano Zampini       ierr = MatGetRow(pcbddc->discretegradient,i,&nc,NULL,NULL);CHKERRQ(ierr);
241213b8bfaSStefano Zampini       if (nc > 1) matis->sf_rootdata[i-rst] = 1;
242213b8bfaSStefano Zampini       ierr = MatRestoreRow(pcbddc->discretegradient,i,&nc,NULL,NULL);CHKERRQ(ierr);
243213b8bfaSStefano Zampini     }
244213b8bfaSStefano Zampini     ierr = PetscSFBcastBegin(matis->sf,MPIU_INT,matis->sf_rootdata,matis->sf_leafdata);CHKERRQ(ierr);
245213b8bfaSStefano Zampini     ierr = PetscSFBcastEnd(matis->sf,MPIU_INT,matis->sf_rootdata,matis->sf_leafdata);CHKERRQ(ierr);
246213b8bfaSStefano Zampini     ierr = PetscMalloc1(n,&idx);CHKERRQ(ierr);
247213b8bfaSStefano Zampini     for (i=0,ne=0;i<n;i++) if (matis->sf_leafdata[i]) idx[ne++] = i;
248213b8bfaSStefano Zampini     ierr = ISCreateGeneral(comm,ne,idx,PETSC_OWN_POINTER,&nedfieldlocal);CHKERRQ(ierr);
249213b8bfaSStefano Zampini   } else {
250213b8bfaSStefano Zampini     SETERRQ(comm,PETSC_ERR_USER,"When multiple fields are present, the Nedelec field has to be specified");
251213b8bfaSStefano Zampini   }
252213b8bfaSStefano Zampini 
253213b8bfaSStefano Zampini   /* Sanity checks */
254213b8bfaSStefano Zampini   if (!order && !conforming) SETERRQ(comm,PETSC_ERR_SUP,"Variable order and non-conforming spaces are not supported at the same time");
255213b8bfaSStefano Zampini   if (pcbddc->user_ChangeOfBasisMatrix) SETERRQ(comm,PETSC_ERR_SUP,"Cannot generate Nedelec support with user defined change of basis");
256213b8bfaSStefano Zampini   if (order && ne%order) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_USER,"The number of local edge dofs %d it's not a multiple of the order %d",ne,order);
257213b8bfaSStefano Zampini 
258213b8bfaSStefano Zampini   /* Just set primal dofs and return */
2591e0482f5SStefano Zampini   if (setprimal) {
260eee23b56SStefano Zampini     IS       enedfieldlocal;
261eee23b56SStefano Zampini     PetscInt *eidxs;
262eee23b56SStefano Zampini 
263eee23b56SStefano Zampini     ierr = PetscMalloc1(ne,&eidxs);CHKERRQ(ierr);
264eee23b56SStefano Zampini     ierr = VecGetArrayRead(matis->counter,(const PetscScalar**)&vals);CHKERRQ(ierr);
265213b8bfaSStefano Zampini     if (nedfieldlocal) {
266213b8bfaSStefano Zampini       ierr = ISGetIndices(nedfieldlocal,&idxs);CHKERRQ(ierr);
267eee23b56SStefano Zampini       for (i=0,cum=0;i<ne;i++) {
268eee23b56SStefano Zampini         if (PetscRealPart(vals[idxs[i]]) > 2.) {
269eee23b56SStefano Zampini           eidxs[cum++] = idxs[i];
270eee23b56SStefano Zampini         }
271eee23b56SStefano Zampini       }
272eee23b56SStefano Zampini       ierr = ISRestoreIndices(nedfieldlocal,&idxs);CHKERRQ(ierr);
273213b8bfaSStefano Zampini     } else {
274213b8bfaSStefano Zampini       for (i=0,cum=0;i<ne;i++) {
275213b8bfaSStefano Zampini         if (PetscRealPart(vals[i]) > 2.) {
276213b8bfaSStefano Zampini           eidxs[cum++] = i;
277213b8bfaSStefano Zampini         }
278213b8bfaSStefano Zampini       }
279213b8bfaSStefano Zampini     }
280213b8bfaSStefano Zampini     ierr = VecRestoreArrayRead(matis->counter,(const PetscScalar**)&vals);CHKERRQ(ierr);
281eee23b56SStefano Zampini     ierr = ISCreateGeneral(comm,cum,eidxs,PETSC_COPY_VALUES,&enedfieldlocal);CHKERRQ(ierr);
282eee23b56SStefano Zampini     ierr = PCBDDCSetPrimalVerticesLocalIS(pc,enedfieldlocal);CHKERRQ(ierr);
283eee23b56SStefano Zampini     ierr = PetscFree(eidxs);CHKERRQ(ierr);
2841e0482f5SStefano Zampini     ierr = ISDestroy(&nedfieldlocal);CHKERRQ(ierr);
285eee23b56SStefano Zampini     ierr = ISDestroy(&enedfieldlocal);CHKERRQ(ierr);
2861e0482f5SStefano Zampini     PetscFunctionReturn(0);
2871e0482f5SStefano Zampini   }
288a13144ffSStefano Zampini 
289213b8bfaSStefano Zampini   /* Compute some l2g maps */
290213b8bfaSStefano Zampini   if (nedfieldlocal) {
291c2151214SStefano Zampini     IS is;
292c2151214SStefano Zampini 
293c2151214SStefano Zampini     /* need to map from the local Nedelec field to local numbering */
294c2151214SStefano Zampini     ierr = ISLocalToGlobalMappingCreateIS(nedfieldlocal,&fl2g);CHKERRQ(ierr);
2951e0482f5SStefano Zampini     /* need to map from the local Nedelec field to global numbering for the whole dofs*/
2961e0482f5SStefano Zampini     ierr = ISLocalToGlobalMappingApplyIS(al2g,nedfieldlocal,&is);CHKERRQ(ierr);
2971e0482f5SStefano Zampini     ierr = ISLocalToGlobalMappingCreateIS(is,&al2g);CHKERRQ(ierr);
2981e0482f5SStefano Zampini     /* need to map from the local Nedelec field to global numbering (for Nedelec only) */
2991e0482f5SStefano Zampini     if (global) {
3001e0482f5SStefano Zampini       ierr = PetscObjectReference((PetscObject)al2g);CHKERRQ(ierr);
3011e0482f5SStefano Zampini       el2g = al2g;
3021e0482f5SStefano Zampini     } else {
3031e0482f5SStefano Zampini       IS gis;
3041e0482f5SStefano Zampini 
3051e0482f5SStefano Zampini       ierr = ISRenumber(is,NULL,NULL,&gis);CHKERRQ(ierr);
3061e0482f5SStefano Zampini       ierr = ISLocalToGlobalMappingCreateIS(gis,&el2g);CHKERRQ(ierr);
3071e0482f5SStefano Zampini       ierr = ISDestroy(&gis);CHKERRQ(ierr);
3081e0482f5SStefano Zampini     }
309c2151214SStefano Zampini     ierr = ISDestroy(&is);CHKERRQ(ierr);
310c2151214SStefano Zampini   } else {
3111e0482f5SStefano Zampini     /* restore default */
3121e0482f5SStefano Zampini     pcbddc->nedfield = -1;
3131e0482f5SStefano Zampini     /* one ref for the destruction of al2g, one for el2g */
3141e0482f5SStefano Zampini     ierr = PetscObjectReference((PetscObject)al2g);CHKERRQ(ierr);
3151e0482f5SStefano Zampini     ierr = PetscObjectReference((PetscObject)al2g);CHKERRQ(ierr);
3161e0482f5SStefano Zampini     el2g = al2g;
317c2151214SStefano Zampini     fl2g = NULL;
318c2151214SStefano Zampini   }
319a13144ffSStefano Zampini 
320213b8bfaSStefano Zampini   /* Start communication to drop connections for interior edges (for cc analysis only) */
321c2151214SStefano Zampini   ierr = PetscMemzero(matis->sf_leafdata,n*sizeof(PetscInt));CHKERRQ(ierr);
322c2151214SStefano Zampini   ierr = PetscMemzero(matis->sf_rootdata,pc->pmat->rmap->n*sizeof(PetscInt));CHKERRQ(ierr);
323c2151214SStefano Zampini   if (nedfieldlocal) {
324c2151214SStefano Zampini     ierr = ISGetIndices(nedfieldlocal,&idxs);CHKERRQ(ierr);
325c2151214SStefano Zampini     for (i=0;i<ne;i++) matis->sf_leafdata[idxs[i]] = 1;
326c2151214SStefano Zampini     ierr = ISRestoreIndices(nedfieldlocal,&idxs);CHKERRQ(ierr);
327c2151214SStefano Zampini   } else {
328c2151214SStefano Zampini     for (i=0;i<ne;i++) matis->sf_leafdata[i] = 1;
329c2151214SStefano Zampini   }
330c2151214SStefano Zampini   ierr = PetscSFReduceBegin(matis->sf,MPIU_INT,matis->sf_leafdata,matis->sf_rootdata,MPI_SUM);CHKERRQ(ierr);
331c2151214SStefano Zampini   ierr = PetscSFReduceEnd(matis->sf,MPIU_INT,matis->sf_leafdata,matis->sf_rootdata,MPI_SUM);CHKERRQ(ierr);
332213b8bfaSStefano Zampini 
333213b8bfaSStefano Zampini   if (!singular) { /* drop connections with interior edges to avoid unneeded communications and memory movements */
334213b8bfaSStefano Zampini     ierr = MatDuplicate(pcbddc->discretegradient,MAT_COPY_VALUES,&G);CHKERRQ(ierr);
335213b8bfaSStefano Zampini     ierr = MatSetOption(G,MAT_KEEP_NONZERO_PATTERN,PETSC_FALSE);CHKERRQ(ierr);
3361e0482f5SStefano Zampini     if (global) {
3371e0482f5SStefano Zampini       PetscInt rst;
3381e0482f5SStefano Zampini 
339c2151214SStefano Zampini       ierr = MatGetOwnershipRange(G,&rst,NULL);CHKERRQ(ierr);
340c2151214SStefano Zampini       for (i=0,cum=0;i<pc->pmat->rmap->n;i++) {
341c2151214SStefano Zampini         if (matis->sf_rootdata[i] < 2) {
342c2151214SStefano Zampini           matis->sf_rootdata[cum++] = i + rst;
343c2151214SStefano Zampini         }
344c2151214SStefano Zampini       }
345a13144ffSStefano Zampini       ierr = MatSetOption(G,MAT_NO_OFF_PROC_ZERO_ROWS,PETSC_TRUE);CHKERRQ(ierr);
346c2151214SStefano Zampini       ierr = MatZeroRows(G,cum,matis->sf_rootdata,0.,NULL,NULL);CHKERRQ(ierr);
3471e0482f5SStefano Zampini     } else {
3481e0482f5SStefano Zampini       PetscInt *tbz;
3491e0482f5SStefano Zampini 
3501e0482f5SStefano Zampini       ierr = PetscMalloc1(ne,&tbz);CHKERRQ(ierr);
3511e0482f5SStefano Zampini       ierr = PetscSFBcastBegin(matis->sf,MPIU_INT,matis->sf_rootdata,matis->sf_leafdata);CHKERRQ(ierr);
3521e0482f5SStefano Zampini       ierr = PetscSFBcastEnd(matis->sf,MPIU_INT,matis->sf_rootdata,matis->sf_leafdata);CHKERRQ(ierr);
3531e0482f5SStefano Zampini       ierr = ISGetIndices(nedfieldlocal,&idxs);CHKERRQ(ierr);
3541e0482f5SStefano Zampini       for (i=0,cum=0;i<ne;i++)
3551e0482f5SStefano Zampini         if (matis->sf_leafdata[idxs[i]] == 1)
3561e0482f5SStefano Zampini           tbz[cum++] = i;
3571e0482f5SStefano Zampini       ierr = ISRestoreIndices(nedfieldlocal,&idxs);CHKERRQ(ierr);
3581e0482f5SStefano Zampini       ierr = ISLocalToGlobalMappingApply(el2g,cum,tbz,tbz);CHKERRQ(ierr);
3591e0482f5SStefano Zampini       ierr = MatZeroRows(G,cum,tbz,0.,NULL,NULL);CHKERRQ(ierr);
3601e0482f5SStefano Zampini       ierr = PetscFree(tbz);CHKERRQ(ierr);
3611e0482f5SStefano Zampini     }
362213b8bfaSStefano Zampini   } else { /* we need the entire G to infer the nullspace */
363213b8bfaSStefano Zampini     ierr = PetscObjectReference((PetscObject)pcbddc->discretegradient);CHKERRQ(ierr);
364213b8bfaSStefano Zampini     G    = pcbddc->discretegradient;
365213b8bfaSStefano Zampini   }
366a13144ffSStefano Zampini 
367a13144ffSStefano Zampini   /* Extract subdomain relevant rows of G */
368a13144ffSStefano Zampini   ierr = ISLocalToGlobalMappingGetIndices(el2g,&idxs);CHKERRQ(ierr);
369a13144ffSStefano Zampini   ierr = ISCreateGeneral(comm,ne,idxs,PETSC_USE_POINTER,&lned);CHKERRQ(ierr);
3707dae84e0SHong Zhang   ierr = MatCreateSubMatrix(G,lned,NULL,MAT_INITIAL_MATRIX,&lGall);CHKERRQ(ierr);
371a13144ffSStefano Zampini   ierr = ISLocalToGlobalMappingRestoreIndices(el2g,&idxs);CHKERRQ(ierr);
372a13144ffSStefano Zampini   ierr = ISDestroy(&lned);CHKERRQ(ierr);
373a13144ffSStefano Zampini   ierr = MatConvert(lGall,MATIS,MAT_INITIAL_MATRIX,&lGis);CHKERRQ(ierr);
374a13144ffSStefano Zampini   ierr = MatDestroy(&lGall);CHKERRQ(ierr);
375a13144ffSStefano Zampini   ierr = MatISGetLocalMat(lGis,&lG);CHKERRQ(ierr);
376a13144ffSStefano Zampini 
377213b8bfaSStefano Zampini   /* SF for nodal dofs communications */
378c2151214SStefano Zampini   ierr = MatGetLocalSize(G,NULL,&Lv);CHKERRQ(ierr);
379a13144ffSStefano Zampini   ierr = MatGetLocalToGlobalMapping(lGis,NULL,&vl2g);CHKERRQ(ierr);
380a13144ffSStefano Zampini   ierr = PetscObjectReference((PetscObject)vl2g);CHKERRQ(ierr);
381a13144ffSStefano Zampini   ierr = ISLocalToGlobalMappingGetSize(vl2g,&nv);CHKERRQ(ierr);
382a13144ffSStefano Zampini   ierr = PetscSFCreate(comm,&sfv);CHKERRQ(ierr);
383a13144ffSStefano Zampini   ierr = ISLocalToGlobalMappingGetIndices(vl2g,&idxs);CHKERRQ(ierr);
384a13144ffSStefano Zampini   ierr = PetscSFSetGraphLayout(sfv,lGis->cmap,nv,NULL,PETSC_OWN_POINTER,idxs);CHKERRQ(ierr);
385a13144ffSStefano Zampini   ierr = ISLocalToGlobalMappingRestoreIndices(vl2g,&idxs);CHKERRQ(ierr);
386213b8bfaSStefano Zampini   i    = singular ? 2 : 1;
387213b8bfaSStefano Zampini   ierr = PetscMalloc2(i*nv,&sfvleaves,i*Lv,&sfvroots);CHKERRQ(ierr);
388a13144ffSStefano Zampini 
3891e0482f5SStefano Zampini   /* Destroy temporary G created in MATIS format and modified G */
390213b8bfaSStefano Zampini   ierr = PetscObjectReference((PetscObject)lG);CHKERRQ(ierr);
391a13144ffSStefano Zampini   ierr = MatDestroy(&lGis);CHKERRQ(ierr);
392213b8bfaSStefano Zampini   ierr = MatDestroy(&G);CHKERRQ(ierr);
393a13144ffSStefano Zampini 
394213b8bfaSStefano Zampini   if (print) {
395213b8bfaSStefano Zampini     ierr = PetscObjectSetName((PetscObject)lG,"initial_lG");CHKERRQ(ierr);
396213b8bfaSStefano Zampini     ierr = MatView(lG,NULL);CHKERRQ(ierr);
397213b8bfaSStefano Zampini   }
398213b8bfaSStefano Zampini 
399213b8bfaSStefano Zampini   /* Save lG for values insertion in change of basis */
4000569b399SStefano Zampini   ierr = MatDuplicate(lG,MAT_COPY_VALUES,&lGinit);CHKERRQ(ierr);
4010569b399SStefano Zampini 
402a13144ffSStefano Zampini   /* Analyze the edge-nodes connections (duplicate lG) */
4034e64d54eSstefano_zampini   ierr = MatDuplicate(lG,MAT_COPY_VALUES,&lGe);CHKERRQ(ierr);
4044e64d54eSstefano_zampini   ierr = MatSetOption(lGe,MAT_KEEP_NONZERO_PATTERN,PETSC_FALSE);CHKERRQ(ierr);
405a13144ffSStefano Zampini   ierr = PetscBTCreate(nv,&btv);CHKERRQ(ierr);
406a13144ffSStefano Zampini   ierr = PetscBTCreate(ne,&bte);CHKERRQ(ierr);
407a13144ffSStefano Zampini   ierr = PetscBTCreate(ne,&btb);CHKERRQ(ierr);
4087d871cd7SStefano Zampini   ierr = PetscBTCreate(ne,&btbd);CHKERRQ(ierr);
409c2151214SStefano Zampini   ierr = PetscBTCreate(nv,&btvcand);CHKERRQ(ierr);
410a13144ffSStefano Zampini   /* need to import the boundary specification to ensure the
411a13144ffSStefano Zampini      proper detection of coarse edges' endpoints */
412a13144ffSStefano Zampini   if (pcbddc->DirichletBoundariesLocal) {
413c2151214SStefano Zampini     IS is;
414c2151214SStefano Zampini 
415c2151214SStefano Zampini     if (fl2g) {
416c2151214SStefano Zampini       ierr = ISGlobalToLocalMappingApplyIS(fl2g,IS_GTOLM_MASK,pcbddc->DirichletBoundariesLocal,&is);CHKERRQ(ierr);
417c2151214SStefano Zampini     } else {
418c2151214SStefano Zampini       is = pcbddc->DirichletBoundariesLocal;
419c2151214SStefano Zampini     }
420c2151214SStefano Zampini     ierr = ISGetLocalSize(is,&cum);CHKERRQ(ierr);
421c2151214SStefano Zampini     ierr = ISGetIndices(is,&idxs);CHKERRQ(ierr);
422a13144ffSStefano Zampini     for (i=0;i<cum;i++) {
423a13144ffSStefano Zampini       if (idxs[i] >= 0) {
424a13144ffSStefano Zampini         ierr = PetscBTSet(btb,idxs[i]);CHKERRQ(ierr);
4257d871cd7SStefano Zampini         ierr = PetscBTSet(btbd,idxs[i]);CHKERRQ(ierr);
426a13144ffSStefano Zampini       }
427a13144ffSStefano Zampini     }
428c2151214SStefano Zampini     ierr = ISRestoreIndices(is,&idxs);CHKERRQ(ierr);
429c2151214SStefano Zampini     if (fl2g) {
430c2151214SStefano Zampini       ierr = ISDestroy(&is);CHKERRQ(ierr);
431c2151214SStefano Zampini     }
432a13144ffSStefano Zampini   }
433a13144ffSStefano Zampini   if (pcbddc->NeumannBoundariesLocal) {
434c2151214SStefano Zampini     IS is;
435c2151214SStefano Zampini 
436c2151214SStefano Zampini     if (fl2g) {
437c2151214SStefano Zampini       ierr = ISGlobalToLocalMappingApplyIS(fl2g,IS_GTOLM_MASK,pcbddc->NeumannBoundariesLocal,&is);CHKERRQ(ierr);
438c2151214SStefano Zampini     } else {
439c2151214SStefano Zampini       is = pcbddc->NeumannBoundariesLocal;
440c2151214SStefano Zampini     }
441c2151214SStefano Zampini     ierr = ISGetLocalSize(is,&cum);CHKERRQ(ierr);
442c2151214SStefano Zampini     ierr = ISGetIndices(is,&idxs);CHKERRQ(ierr);
443a13144ffSStefano Zampini     for (i=0;i<cum;i++) {
444a13144ffSStefano Zampini       if (idxs[i] >= 0) {
445a13144ffSStefano Zampini         ierr = PetscBTSet(btb,idxs[i]);CHKERRQ(ierr);
446a13144ffSStefano Zampini       }
447a13144ffSStefano Zampini     }
448c2151214SStefano Zampini     ierr = ISRestoreIndices(is,&idxs);CHKERRQ(ierr);
449c2151214SStefano Zampini     if (fl2g) {
450c2151214SStefano Zampini       ierr = ISDestroy(&is);CHKERRQ(ierr);
451a13144ffSStefano Zampini     }
452c2151214SStefano Zampini   }
453c2151214SStefano Zampini 
454213b8bfaSStefano Zampini   /* Count neighs per dof */
455637e8532SStefano Zampini   ierr = PetscCalloc1(ne,&ecount);CHKERRQ(ierr);
456637e8532SStefano Zampini   ierr = PetscMalloc1(ne,&eneighs);CHKERRQ(ierr);
457637e8532SStefano Zampini   ierr = ISLocalToGlobalMappingGetInfo(el2g,&n_neigh,&neigh,&n_shared,&shared);CHKERRQ(ierr);
458637e8532SStefano Zampini   for (i=1,cum=0;i<n_neigh;i++) {
459637e8532SStefano Zampini     cum += n_shared[i];
460637e8532SStefano Zampini     for (j=0;j<n_shared[i];j++) {
461637e8532SStefano Zampini       ecount[shared[i][j]]++;
462637e8532SStefano Zampini     }
463637e8532SStefano Zampini   }
464637e8532SStefano Zampini   if (ne) {
465637e8532SStefano Zampini     ierr = PetscMalloc1(cum,&eneighs[0]);CHKERRQ(ierr);
466637e8532SStefano Zampini   }
467637e8532SStefano Zampini   for (i=1;i<ne;i++) eneighs[i] = eneighs[i-1] + ecount[i-1];
468637e8532SStefano Zampini   ierr = PetscMemzero(ecount,ne*sizeof(PetscInt));CHKERRQ(ierr);
469637e8532SStefano Zampini   for (i=1;i<n_neigh;i++) {
470637e8532SStefano Zampini     for (j=0;j<n_shared[i];j++) {
471637e8532SStefano Zampini       PetscInt k = shared[i][j];
472637e8532SStefano Zampini       eneighs[k][ecount[k]] = neigh[i];
473637e8532SStefano Zampini       ecount[k]++;
474637e8532SStefano Zampini     }
475637e8532SStefano Zampini   }
476637e8532SStefano Zampini   for (i=0;i<ne;i++) {
477637e8532SStefano Zampini     ierr = PetscSortRemoveDupsInt(&ecount[i],eneighs[i]);CHKERRQ(ierr);
478637e8532SStefano Zampini   }
479637e8532SStefano Zampini   ierr = ISLocalToGlobalMappingRestoreInfo(el2g,&n_neigh,&neigh,&n_shared,&shared);CHKERRQ(ierr);
480637e8532SStefano Zampini   ierr = PetscCalloc1(nv,&vcount);CHKERRQ(ierr);
481637e8532SStefano Zampini   ierr = PetscMalloc1(nv,&vneighs);CHKERRQ(ierr);
482637e8532SStefano Zampini   ierr = ISLocalToGlobalMappingGetInfo(vl2g,&n_neigh,&neigh,&n_shared,&shared);CHKERRQ(ierr);
483637e8532SStefano Zampini   for (i=1,cum=0;i<n_neigh;i++) {
484637e8532SStefano Zampini     cum += n_shared[i];
485637e8532SStefano Zampini     for (j=0;j<n_shared[i];j++) {
486637e8532SStefano Zampini       vcount[shared[i][j]]++;
487637e8532SStefano Zampini     }
488637e8532SStefano Zampini   }
489637e8532SStefano Zampini   if (nv) {
490637e8532SStefano Zampini     ierr = PetscMalloc1(cum,&vneighs[0]);CHKERRQ(ierr);
491637e8532SStefano Zampini   }
492637e8532SStefano Zampini   for (i=1;i<nv;i++) vneighs[i] = vneighs[i-1] + vcount[i-1];
493637e8532SStefano Zampini   ierr = PetscMemzero(vcount,nv*sizeof(PetscInt));CHKERRQ(ierr);
494637e8532SStefano Zampini   for (i=1;i<n_neigh;i++) {
495637e8532SStefano Zampini     for (j=0;j<n_shared[i];j++) {
496637e8532SStefano Zampini       PetscInt k = shared[i][j];
497637e8532SStefano Zampini       vneighs[k][vcount[k]] = neigh[i];
498637e8532SStefano Zampini       vcount[k]++;
499637e8532SStefano Zampini     }
500637e8532SStefano Zampini   }
501637e8532SStefano Zampini   for (i=0;i<nv;i++) {
502637e8532SStefano Zampini     ierr = PetscSortRemoveDupsInt(&vcount[i],vneighs[i]);CHKERRQ(ierr);
503637e8532SStefano Zampini   }
504637e8532SStefano Zampini   ierr = ISLocalToGlobalMappingRestoreInfo(vl2g,&n_neigh,&neigh,&n_shared,&shared);CHKERRQ(ierr);
505637e8532SStefano Zampini 
5067d871cd7SStefano Zampini   /* need to remove coarse faces' dofs and coarse edges' dirichlet dofs
5077d871cd7SStefano Zampini      for proper detection of coarse edges' endpoints */
50862b0c6f7SStefano Zampini   ierr = PetscBTCreate(ne,&btee);CHKERRQ(ierr);
50962b0c6f7SStefano Zampini   for (i=0;i<ne;i++) {
5107d871cd7SStefano Zampini     if ((ecount[i] > 1 && !PetscBTLookup(btbd,i)) || (ecount[i] == 1 && PetscBTLookup(btb,i))) {
51162b0c6f7SStefano Zampini       ierr = PetscBTSet(btee,i);CHKERRQ(ierr);
51262b0c6f7SStefano Zampini     }
51362b0c6f7SStefano Zampini   }
514637e8532SStefano Zampini   ierr = PetscMalloc1(ne,&marks);CHKERRQ(ierr);
51562b0c6f7SStefano Zampini   if (!conforming) {
51662b0c6f7SStefano Zampini     ierr = MatTranspose(lGe,MAT_INITIAL_MATRIX,&lGt);CHKERRQ(ierr);
51762b0c6f7SStefano Zampini     ierr = MatGetRowIJ(lGt,0,PETSC_FALSE,PETSC_FALSE,&i,&iit,&jjt,&done);CHKERRQ(ierr);
51862b0c6f7SStefano Zampini   }
5194e64d54eSstefano_zampini   ierr = MatGetRowIJ(lGe,0,PETSC_FALSE,PETSC_FALSE,&i,&ii,&jj,&done);CHKERRQ(ierr);
520dec27d64SStefano Zampini   ierr = MatSeqAIJGetArray(lGe,&vals);CHKERRQ(ierr);
52162b0c6f7SStefano Zampini   cum  = 0;
522a13144ffSStefano Zampini   for (i=0;i<ne;i++) {
523dec27d64SStefano Zampini     /* eliminate rows corresponding to edge dofs belonging to coarse faces */
52462b0c6f7SStefano Zampini     if (!PetscBTLookup(btee,i)) {
525a13144ffSStefano Zampini       marks[cum++] = i;
526dec27d64SStefano Zampini       continue;
527dec27d64SStefano Zampini     }
528dec27d64SStefano Zampini     /* set badly connected edge dofs as primal */
52962b0c6f7SStefano Zampini     if (!conforming) {
53062b0c6f7SStefano Zampini       if (ii[i+1]-ii[i] != order + 1) { /* every row of G on the coarse edge should list order+1 nodal dofs */
531a13144ffSStefano Zampini         marks[cum++] = i;
532a13144ffSStefano Zampini         ierr = PetscBTSet(bte,i);CHKERRQ(ierr);
533a13144ffSStefano Zampini         for (j=ii[i];j<ii[i+1];j++) {
534a13144ffSStefano Zampini           ierr = PetscBTSet(btv,jj[j]);CHKERRQ(ierr);
535a13144ffSStefano Zampini         }
53662b0c6f7SStefano Zampini       } else {
53762b0c6f7SStefano Zampini         /* every edge dof should be connected through a certain number of nodal dofs
53862b0c6f7SStefano Zampini            to other edge dofs belonging to coarse edges
53962b0c6f7SStefano Zampini            - at most 2 endpoints
54062b0c6f7SStefano Zampini            - order-1 interior nodal dofs
54162b0c6f7SStefano Zampini            - no undefined nodal dofs (nconn < order)
54262b0c6f7SStefano Zampini         */
54362b0c6f7SStefano Zampini         PetscInt ends = 0,ints = 0, undef = 0;
54462b0c6f7SStefano Zampini         for (j=ii[i];j<ii[i+1];j++) {
54562b0c6f7SStefano Zampini           PetscInt v = jj[j],k;
54662b0c6f7SStefano Zampini           PetscInt nconn = iit[v+1]-iit[v];
54762b0c6f7SStefano Zampini           for (k=iit[v];k<iit[v+1];k++) if (!PetscBTLookup(btee,jjt[k])) nconn--;
54862b0c6f7SStefano Zampini           if (nconn > order) ends++;
54962b0c6f7SStefano Zampini           else if (nconn == order) ints++;
55062b0c6f7SStefano Zampini           else undef++;
55162b0c6f7SStefano Zampini         }
55262b0c6f7SStefano Zampini         if (undef || ends > 2 || ints != order -1) {
55362b0c6f7SStefano Zampini           marks[cum++] = i;
55462b0c6f7SStefano Zampini           ierr = PetscBTSet(bte,i);CHKERRQ(ierr);
55562b0c6f7SStefano Zampini           for (j=ii[i];j<ii[i+1];j++) {
55662b0c6f7SStefano Zampini             ierr = PetscBTSet(btv,jj[j]);CHKERRQ(ierr);
55762b0c6f7SStefano Zampini           }
55862b0c6f7SStefano Zampini         }
55962b0c6f7SStefano Zampini       }
560a13144ffSStefano Zampini     }
561dec27d64SStefano Zampini     /* We assume the order on the element edge is ii[i+1]-ii[i]-1 */
562dec27d64SStefano Zampini     if (!order && ii[i+1] != ii[i]) {
563dec27d64SStefano Zampini       PetscScalar val = 1./(ii[i+1]-ii[i]-1);
564dec27d64SStefano Zampini       for (j=ii[i];j<ii[i+1];j++) vals[j] = val;
565a13144ffSStefano Zampini     }
566dec27d64SStefano Zampini   }
56762b0c6f7SStefano Zampini   ierr = PetscBTDestroy(&btee);CHKERRQ(ierr);
568dec27d64SStefano Zampini   ierr = MatSeqAIJRestoreArray(lGe,&vals);CHKERRQ(ierr);
5694e64d54eSstefano_zampini   ierr = MatRestoreRowIJ(lGe,0,PETSC_FALSE,PETSC_FALSE,&i,&ii,&jj,&done);CHKERRQ(ierr);
57062b0c6f7SStefano Zampini   if (!conforming) {
57162b0c6f7SStefano Zampini     ierr = MatRestoreRowIJ(lGt,0,PETSC_FALSE,PETSC_FALSE,&i,&iit,&jjt,&done);CHKERRQ(ierr);
57262b0c6f7SStefano Zampini     ierr = MatDestroy(&lGt);CHKERRQ(ierr);
57362b0c6f7SStefano Zampini   }
5744e64d54eSstefano_zampini   ierr = MatZeroRows(lGe,cum,marks,0.,NULL,NULL);CHKERRQ(ierr);
575637e8532SStefano Zampini 
576b03ebc13SStefano Zampini   /* identify splitpoints and corner candidates */
5774e64d54eSstefano_zampini   ierr = MatTranspose(lGe,MAT_INITIAL_MATRIX,&lGt);CHKERRQ(ierr);
578a13144ffSStefano Zampini   if (print) {
5794e64d54eSstefano_zampini     ierr = PetscObjectSetName((PetscObject)lGe,"edgerestr_lG");CHKERRQ(ierr);
5804e64d54eSstefano_zampini     ierr = MatView(lGe,NULL);CHKERRQ(ierr);
5814e64d54eSstefano_zampini     ierr = PetscObjectSetName((PetscObject)lGt,"edgerestr_lGt");CHKERRQ(ierr);
582a13144ffSStefano Zampini     ierr = MatView(lGt,NULL);CHKERRQ(ierr);
583a13144ffSStefano Zampini   }
584a13144ffSStefano Zampini   ierr = MatGetRowIJ(lGt,0,PETSC_FALSE,PETSC_FALSE,&i,&ii,&jj,&done);CHKERRQ(ierr);
585dec27d64SStefano Zampini   ierr = MatSeqAIJGetArray(lGt,&vals);CHKERRQ(ierr);
586a13144ffSStefano Zampini   for (i=0;i<nv;i++) {
587637e8532SStefano Zampini     PetscInt  ord = order, test = ii[i+1]-ii[i], vc = vcount[i];
5887d871cd7SStefano Zampini     PetscBool sneighs = PETSC_TRUE, bdir = PETSC_FALSE;
589b03ebc13SStefano Zampini     if (!order) { /* variable order */
590dec27d64SStefano Zampini       PetscReal vorder = 0.;
591dec27d64SStefano Zampini 
592dec27d64SStefano Zampini       for (j=ii[i];j<ii[i+1];j++) vorder += PetscRealPart(vals[j]);
593dec27d64SStefano Zampini       test = PetscFloorReal(vorder+10.*PETSC_SQRT_MACHINE_EPSILON);
594dec27d64SStefano Zampini       if (vorder-test > PETSC_SQRT_MACHINE_EPSILON) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Unexpected value for vorder: %g (%d)",vorder,test);
595dec27d64SStefano Zampini       ord  = 1;
596dec27d64SStefano Zampini     }
597a13144ffSStefano Zampini #if defined(PETSC_USE_DEBUG)
598dec27d64SStefano Zampini     if (test%ord) SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Unexpected number of edge dofs %d connected with nodal dof %d with order %d",test,i,ord);
599a13144ffSStefano Zampini #endif
600637e8532SStefano Zampini     for (j=ii[i];j<ii[i+1] && sneighs;j++) {
6017d871cd7SStefano Zampini       if (PetscBTLookup(btbd,jj[j])) {
6027d871cd7SStefano Zampini         bdir = PETSC_TRUE;
6037d871cd7SStefano Zampini         break;
6047d871cd7SStefano Zampini       }
605637e8532SStefano Zampini       if (vc != ecount[jj[j]]) {
606637e8532SStefano Zampini         sneighs = PETSC_FALSE;
607637e8532SStefano Zampini       } else {
608637e8532SStefano Zampini         PetscInt k,*vn = vneighs[i], *en = eneighs[jj[j]];
609637e8532SStefano Zampini         for (k=0;k<vc;k++) {
610637e8532SStefano Zampini           if (vn[k] != en[k]) {
611637e8532SStefano Zampini             sneighs = PETSC_FALSE;
612637e8532SStefano Zampini             break;
613637e8532SStefano Zampini           }
614637e8532SStefano Zampini         }
615637e8532SStefano Zampini       }
616637e8532SStefano Zampini     }
6177d871cd7SStefano Zampini     if (!sneighs || test >= 3*ord || bdir) { /* splitpoints */
6187d871cd7SStefano Zampini       if (print) PetscPrintf(PETSC_COMM_SELF,"SPLITPOINT %d (%d %d %d)\n",i,!sneighs,test >= 3*ord,bdir);
619a13144ffSStefano Zampini       ierr = PetscBTSet(btv,i);CHKERRQ(ierr);
620dec27d64SStefano Zampini     } else if (test == ord) {
621b03ebc13SStefano Zampini       if (order == 1 || (!order && ii[i+1]-ii[i] == 1)) {
622a13144ffSStefano Zampini         if (print) PetscPrintf(PETSC_COMM_SELF,"ENDPOINT %d\n",i);
623a13144ffSStefano Zampini         ierr = PetscBTSet(btv,i);CHKERRQ(ierr);
624a13144ffSStefano Zampini       } else {
625a13144ffSStefano Zampini         if (print) PetscPrintf(PETSC_COMM_SELF,"CORNER CANDIDATE %d\n",i);
626a13144ffSStefano Zampini         ierr = PetscBTSet(btvcand,i);CHKERRQ(ierr);
627a13144ffSStefano Zampini       }
628a13144ffSStefano Zampini     }
629a13144ffSStefano Zampini   }
630637e8532SStefano Zampini   ierr = PetscFree(ecount);CHKERRQ(ierr);
631637e8532SStefano Zampini   ierr = PetscFree(vcount);CHKERRQ(ierr);
632637e8532SStefano Zampini   if (ne) {
633637e8532SStefano Zampini     ierr = PetscFree(eneighs[0]);CHKERRQ(ierr);
634637e8532SStefano Zampini   }
635637e8532SStefano Zampini   if (nv) {
636637e8532SStefano Zampini     ierr = PetscFree(vneighs[0]);CHKERRQ(ierr);
637637e8532SStefano Zampini   }
638637e8532SStefano Zampini   ierr = PetscFree(eneighs);CHKERRQ(ierr);
639637e8532SStefano Zampini   ierr = PetscFree(vneighs);CHKERRQ(ierr);
6407d871cd7SStefano Zampini   ierr = PetscBTDestroy(&btbd);CHKERRQ(ierr);
641b03ebc13SStefano Zampini 
642b03ebc13SStefano Zampini   /* a candidate is valid if it is connected to another candidate via a non-primal edge dof */
643b03ebc13SStefano Zampini   if (order != 1) {
644b03ebc13SStefano Zampini     if (print) PetscPrintf(PETSC_COMM_SELF,"INSPECTING CANDIDATES\n");
645b03ebc13SStefano Zampini     ierr = MatGetRowIJ(lGe,0,PETSC_FALSE,PETSC_FALSE,&i,&iit,&jjt,&done);CHKERRQ(ierr);
646b03ebc13SStefano Zampini     for (i=0;i<nv;i++) {
647b03ebc13SStefano Zampini       if (PetscBTLookup(btvcand,i)) {
648b03ebc13SStefano Zampini         PetscBool found = PETSC_FALSE;
649b03ebc13SStefano Zampini         for (j=ii[i];j<ii[i+1] && !found;j++) {
650b03ebc13SStefano Zampini           PetscInt k,e = jj[j];
651b03ebc13SStefano Zampini           if (PetscBTLookup(bte,e)) continue;
652b03ebc13SStefano Zampini           for (k=iit[e];k<iit[e+1];k++) {
653b03ebc13SStefano Zampini             PetscInt v = jjt[k];
654b03ebc13SStefano Zampini             if (v != i && PetscBTLookup(btvcand,v)) {
655b03ebc13SStefano Zampini               found = PETSC_TRUE;
656b03ebc13SStefano Zampini               break;
657b03ebc13SStefano Zampini             }
658b03ebc13SStefano Zampini           }
659b03ebc13SStefano Zampini         }
660b03ebc13SStefano Zampini         if (!found) {
661b03ebc13SStefano Zampini           if (print) PetscPrintf(PETSC_COMM_SELF,"  CANDIDATE %d CLEARED\n",i);
662b03ebc13SStefano Zampini           ierr = PetscBTClear(btvcand,i);CHKERRQ(ierr);
663b03ebc13SStefano Zampini         } else {
664b03ebc13SStefano Zampini           if (print) PetscPrintf(PETSC_COMM_SELF,"  CANDIDATE %d ACCEPTED\n",i);
665b03ebc13SStefano Zampini         }
666b03ebc13SStefano Zampini       }
667b03ebc13SStefano Zampini     }
668b03ebc13SStefano Zampini     ierr = MatRestoreRowIJ(lGe,0,PETSC_FALSE,PETSC_FALSE,&i,&iit,&jjt,&done);CHKERRQ(ierr);
669b03ebc13SStefano Zampini   }
670dec27d64SStefano Zampini   ierr = MatSeqAIJRestoreArray(lGt,&vals);CHKERRQ(ierr);
671a13144ffSStefano Zampini   ierr = MatRestoreRowIJ(lGt,0,PETSC_FALSE,PETSC_FALSE,&i,&ii,&jj,&done);CHKERRQ(ierr);
672b03ebc13SStefano Zampini   ierr = MatDestroy(&lGe);CHKERRQ(ierr);
673a13144ffSStefano Zampini 
674a13144ffSStefano Zampini   /* Get the local G^T explicitly */
6750569b399SStefano Zampini   ierr = MatDestroy(&lGt);CHKERRQ(ierr);
676a13144ffSStefano Zampini   ierr = MatTranspose(lG,MAT_INITIAL_MATRIX,&lGt);CHKERRQ(ierr);
6774e64d54eSstefano_zampini   ierr = MatSetOption(lGt,MAT_KEEP_NONZERO_PATTERN,PETSC_FALSE);CHKERRQ(ierr);
678a13144ffSStefano Zampini 
6794e64d54eSstefano_zampini   /* Mark interior nodal dofs */
680a13144ffSStefano Zampini   ierr = ISLocalToGlobalMappingGetInfo(vl2g,&n_neigh,&neigh,&n_shared,&shared);CHKERRQ(ierr);
6814e64d54eSstefano_zampini   ierr = PetscBTCreate(nv,&btvi);CHKERRQ(ierr);
682a13144ffSStefano Zampini   for (i=1;i<n_neigh;i++) {
683a13144ffSStefano Zampini     for (j=0;j<n_shared[i];j++) {
6844e64d54eSstefano_zampini       ierr = PetscBTSet(btvi,shared[i][j]);CHKERRQ(ierr);
685a13144ffSStefano Zampini     }
686a13144ffSStefano Zampini   }
687a13144ffSStefano Zampini   ierr = ISLocalToGlobalMappingRestoreInfo(vl2g,&n_neigh,&neigh,&n_shared,&shared);CHKERRQ(ierr);
688a13144ffSStefano Zampini 
689a13144ffSStefano Zampini   /* communicate corners and splitpoints */
690a13144ffSStefano Zampini   ierr = PetscMalloc1(nv,&vmarks);CHKERRQ(ierr);
691a13144ffSStefano Zampini   ierr = PetscMemzero(sfvleaves,nv*sizeof(PetscInt));CHKERRQ(ierr);
692a13144ffSStefano Zampini   ierr = PetscMemzero(sfvroots,Lv*sizeof(PetscInt));CHKERRQ(ierr);
693a13144ffSStefano Zampini   for (i=0;i<nv;i++) if (PetscUnlikely(PetscBTLookup(btv,i))) sfvleaves[i] = 1;
694a13144ffSStefano Zampini 
695a13144ffSStefano Zampini   if (print) {
696a13144ffSStefano Zampini     IS tbz;
697a13144ffSStefano Zampini 
698a13144ffSStefano Zampini     cum = 0;
699a13144ffSStefano Zampini     for (i=0;i<nv;i++)
700a13144ffSStefano Zampini       if (sfvleaves[i])
701a13144ffSStefano Zampini         vmarks[cum++] = i;
702a13144ffSStefano Zampini 
703a13144ffSStefano Zampini     ierr = ISCreateGeneral(PETSC_COMM_SELF,cum,vmarks,PETSC_COPY_VALUES,&tbz);CHKERRQ(ierr);
704a13144ffSStefano Zampini     ierr = PetscObjectSetName((PetscObject)tbz,"corners_to_be_zeroed_local");CHKERRQ(ierr);
705a13144ffSStefano Zampini     ierr = ISView(tbz,NULL);CHKERRQ(ierr);
706a13144ffSStefano Zampini     ierr = ISDestroy(&tbz);CHKERRQ(ierr);
707a13144ffSStefano Zampini   }
708a13144ffSStefano Zampini 
709a13144ffSStefano Zampini   ierr = PetscSFReduceBegin(sfv,MPIU_INT,sfvleaves,sfvroots,MPI_SUM);CHKERRQ(ierr);
710a13144ffSStefano Zampini   ierr = PetscSFReduceEnd(sfv,MPIU_INT,sfvleaves,sfvroots,MPI_SUM);CHKERRQ(ierr);
711a13144ffSStefano Zampini   ierr = PetscSFBcastBegin(sfv,MPIU_INT,sfvroots,sfvleaves);CHKERRQ(ierr);
712a13144ffSStefano Zampini   ierr = PetscSFBcastEnd(sfv,MPIU_INT,sfvroots,sfvleaves);CHKERRQ(ierr);
713a13144ffSStefano Zampini 
7144e64d54eSstefano_zampini   /* Zero rows of lGt corresponding to identified corners
7154e64d54eSstefano_zampini      and interior nodal dofs */
716a13144ffSStefano Zampini   cum = 0;
717a13144ffSStefano Zampini   for (i=0;i<nv;i++) {
718a13144ffSStefano Zampini     if (sfvleaves[i]) {
719a13144ffSStefano Zampini       vmarks[cum++] = i;
720a13144ffSStefano Zampini       ierr = PetscBTSet(btv,i);CHKERRQ(ierr);
721a13144ffSStefano Zampini     }
7224e64d54eSstefano_zampini     if (!PetscBTLookup(btvi,i)) vmarks[cum++] = i;
723a13144ffSStefano Zampini   }
7244e64d54eSstefano_zampini   ierr = PetscBTDestroy(&btvi);CHKERRQ(ierr);
725a13144ffSStefano Zampini   if (print) {
726a13144ffSStefano Zampini     IS tbz;
727a13144ffSStefano Zampini 
728a13144ffSStefano Zampini     ierr = ISCreateGeneral(PETSC_COMM_SELF,cum,vmarks,PETSC_COPY_VALUES,&tbz);CHKERRQ(ierr);
7294e64d54eSstefano_zampini     ierr = PetscObjectSetName((PetscObject)tbz,"corners_to_be_zeroed_with_interior");CHKERRQ(ierr);
730a13144ffSStefano Zampini     ierr = ISView(tbz,NULL);CHKERRQ(ierr);
731a13144ffSStefano Zampini     ierr = ISDestroy(&tbz);CHKERRQ(ierr);
732a13144ffSStefano Zampini   }
733a13144ffSStefano Zampini   ierr = MatZeroRows(lGt,cum,vmarks,0.,NULL,NULL);CHKERRQ(ierr);
734a13144ffSStefano Zampini   ierr = PetscFree(vmarks);CHKERRQ(ierr);
735a13144ffSStefano Zampini   ierr = PetscSFDestroy(&sfv);CHKERRQ(ierr);
736a13144ffSStefano Zampini   ierr = PetscFree2(sfvleaves,sfvroots);CHKERRQ(ierr);
737a13144ffSStefano Zampini 
738a13144ffSStefano Zampini   /* Recompute G */
739a13144ffSStefano Zampini   ierr = MatDestroy(&lG);CHKERRQ(ierr);
740a13144ffSStefano Zampini   ierr = MatTranspose(lGt,MAT_INITIAL_MATRIX,&lG);CHKERRQ(ierr);
741a13144ffSStefano Zampini   if (print) {
742a13144ffSStefano Zampini     ierr = PetscObjectSetName((PetscObject)lG,"used_lG");CHKERRQ(ierr);
743a13144ffSStefano Zampini     ierr = MatView(lG,NULL);CHKERRQ(ierr);
744a13144ffSStefano Zampini     ierr = PetscObjectSetName((PetscObject)lGt,"used_lGt");CHKERRQ(ierr);
745a13144ffSStefano Zampini     ierr = MatView(lGt,NULL);CHKERRQ(ierr);
746a13144ffSStefano Zampini   }
747a13144ffSStefano Zampini 
748a13144ffSStefano Zampini   /* Get primal dofs (if any) */
749a13144ffSStefano Zampini   cum = 0;
750a13144ffSStefano Zampini   for (i=0;i<ne;i++) {
751a13144ffSStefano Zampini     if (PetscUnlikely(PetscBTLookup(bte,i))) marks[cum++] = i;
752a13144ffSStefano Zampini   }
753c2151214SStefano Zampini   if (fl2g) {
754c2151214SStefano Zampini     ierr = ISLocalToGlobalMappingApply(fl2g,cum,marks,marks);CHKERRQ(ierr);
755c2151214SStefano Zampini   }
756a13144ffSStefano Zampini   ierr = ISCreateGeneral(comm,cum,marks,PETSC_COPY_VALUES,&primals);CHKERRQ(ierr);
757a13144ffSStefano Zampini   if (print) {
758a13144ffSStefano Zampini     ierr = PetscObjectSetName((PetscObject)primals,"prescribed_primal_dofs");CHKERRQ(ierr);
759a13144ffSStefano Zampini     ierr = ISView(primals,NULL);CHKERRQ(ierr);
760a13144ffSStefano Zampini   }
761a13144ffSStefano Zampini   ierr = PetscBTDestroy(&bte);CHKERRQ(ierr);
762c2151214SStefano Zampini   /* TODO: what if the user passed in some of them ?  */
763a13144ffSStefano Zampini   ierr = PCBDDCSetPrimalVerticesLocalIS(pc,primals);CHKERRQ(ierr);
764a13144ffSStefano Zampini   ierr = ISDestroy(&primals);CHKERRQ(ierr);
765a13144ffSStefano Zampini 
766a13144ffSStefano Zampini   /* Compute edge connectivity */
767a13144ffSStefano Zampini   ierr = PetscObjectSetOptionsPrefix((PetscObject)lG,"econn_");CHKERRQ(ierr);
768a13144ffSStefano Zampini   ierr = MatMatMultSymbolic(lG,lGt,PETSC_DEFAULT,&conn);CHKERRQ(ierr);
769a13144ffSStefano Zampini   ierr = MatGetRowIJ(conn,0,PETSC_FALSE,PETSC_FALSE,&i,&ii,&jj,&done);CHKERRQ(ierr);
770c2151214SStefano Zampini   if (fl2g) {
771c2151214SStefano Zampini     PetscBT   btf;
772c2151214SStefano Zampini     PetscInt  *iia,*jja,*iiu,*jju;
773c2151214SStefano Zampini     PetscBool rest = PETSC_FALSE,free = PETSC_FALSE;
774c2151214SStefano Zampini 
775c2151214SStefano Zampini     /* create CSR for all local dofs */
776c2151214SStefano Zampini     ierr = PetscMalloc1(n+1,&iia);CHKERRQ(ierr);
777c2151214SStefano Zampini     if (pcbddc->mat_graph->nvtxs_csr) { /* the user has passed in a CSR graph */
778c2151214SStefano Zampini       if (pcbddc->mat_graph->nvtxs_csr != n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_USER,"Invalid size of CSR graph %d. Should be %d\n",pcbddc->mat_graph->nvtxs_csr,n);
779c2151214SStefano Zampini       iiu = pcbddc->mat_graph->xadj;
780c2151214SStefano Zampini       jju = pcbddc->mat_graph->adjncy;
781c2151214SStefano Zampini     } else if (pcbddc->use_local_adj) {
782c2151214SStefano Zampini       rest = PETSC_TRUE;
783c2151214SStefano Zampini       ierr = MatGetRowIJ(matis->A,0,PETSC_TRUE,PETSC_FALSE,&i,(const PetscInt**)&iiu,(const PetscInt**)&jju,&done);CHKERRQ(ierr);
784c2151214SStefano Zampini     } else {
785c2151214SStefano Zampini       free   = PETSC_TRUE;
786c2151214SStefano Zampini       ierr   = PetscMalloc2(n+1,&iiu,n,&jju);CHKERRQ(ierr);
787c2151214SStefano Zampini       iiu[0] = 0;
788c2151214SStefano Zampini       for (i=0;i<n;i++) {
789c2151214SStefano Zampini         iiu[i+1] = i+1;
790c2151214SStefano Zampini         jju[i]   = -1;
791d904f53bSStefano Zampini       }
792c2151214SStefano Zampini     }
793c2151214SStefano Zampini 
794c2151214SStefano Zampini     /* import sizes of CSR */
795c2151214SStefano Zampini     iia[0] = 0;
796c2151214SStefano Zampini     for (i=0;i<n;i++) iia[i+1] = iiu[i+1]-iiu[i];
797c2151214SStefano Zampini 
798c2151214SStefano Zampini     /* overwrite entries corresponding to the Nedelec field */
799c2151214SStefano Zampini     ierr = PetscBTCreate(n,&btf);CHKERRQ(ierr);
800c2151214SStefano Zampini     ierr = ISGetIndices(nedfieldlocal,&idxs);CHKERRQ(ierr);
801c2151214SStefano Zampini     for (i=0;i<ne;i++) {
802c2151214SStefano Zampini       ierr = PetscBTSet(btf,idxs[i]);CHKERRQ(ierr);
803c2151214SStefano Zampini       iia[idxs[i]+1] = ii[i+1]-ii[i];
804c2151214SStefano Zampini     }
805c2151214SStefano Zampini 
806c2151214SStefano Zampini     /* iia in CSR */
807c2151214SStefano Zampini     for (i=0;i<n;i++) iia[i+1] += iia[i];
808c2151214SStefano Zampini 
809c2151214SStefano Zampini     /* jja in CSR */
810c2151214SStefano Zampini     ierr = PetscMalloc1(iia[n],&jja);CHKERRQ(ierr);
811c2151214SStefano Zampini     for (i=0;i<n;i++)
812c2151214SStefano Zampini       if (!PetscBTLookup(btf,i))
813c2151214SStefano Zampini         for (j=0;j<iiu[i+1]-iiu[i];j++)
814c2151214SStefano Zampini           jja[iia[i]+j] = jju[iiu[i]+j];
815c2151214SStefano Zampini 
816c2151214SStefano Zampini     /* map edge dofs connectivity */
8171e0482f5SStefano Zampini     if (jj) {
818c2151214SStefano Zampini       ierr = ISLocalToGlobalMappingApply(fl2g,ii[ne],jj,(PetscInt *)jj);CHKERRQ(ierr);
819c2151214SStefano Zampini       for (i=0;i<ne;i++) {
820c2151214SStefano Zampini         PetscInt e = idxs[i];
821c2151214SStefano Zampini         for (j=0;j<ii[i+1]-ii[i];j++) jja[iia[e]+j] = jj[ii[i]+j];
822c2151214SStefano Zampini       }
8231e0482f5SStefano Zampini     }
824c2151214SStefano Zampini     ierr = ISRestoreIndices(nedfieldlocal,&idxs);CHKERRQ(ierr);
825c2151214SStefano Zampini     ierr = PCBDDCSetLocalAdjacencyGraph(pc,n,iia,jja,PETSC_OWN_POINTER);CHKERRQ(ierr);
826c2151214SStefano Zampini     if (rest) {
827c2151214SStefano Zampini       ierr = MatRestoreRowIJ(matis->A,0,PETSC_TRUE,PETSC_FALSE,&i,(const PetscInt**)&iiu,(const PetscInt**)&jju,&done);CHKERRQ(ierr);
828c2151214SStefano Zampini     }
829c2151214SStefano Zampini     if (free) {
830c2151214SStefano Zampini       ierr = PetscFree2(iiu,jju);CHKERRQ(ierr);
831c2151214SStefano Zampini     }
832c2151214SStefano Zampini     ierr = PetscBTDestroy(&btf);CHKERRQ(ierr);
833c2151214SStefano Zampini   } else {
834c2151214SStefano Zampini     ierr = PCBDDCSetLocalAdjacencyGraph(pc,n,ii,jj,PETSC_USE_POINTER);CHKERRQ(ierr);
835c2151214SStefano Zampini   }
836c2151214SStefano Zampini 
837a13144ffSStefano Zampini   /* Analyze interface for edge dofs */
838a13144ffSStefano Zampini   ierr = PCBDDCAnalyzeInterface(pc);CHKERRQ(ierr);
839213b8bfaSStefano Zampini   pcbddc->mat_graph->twodim = PETSC_FALSE;
840a13144ffSStefano Zampini 
841a13144ffSStefano Zampini   /* Get coarse edges in the edge space */
842c2151214SStefano Zampini   ierr = PCBDDCGraphGetCandidatesIS(pcbddc->mat_graph,NULL,NULL,&nee,&alleedges,&allprimals);CHKERRQ(ierr);
843a13144ffSStefano Zampini   ierr = MatRestoreRowIJ(conn,0,PETSC_FALSE,PETSC_FALSE,&i,&ii,&jj,&done);CHKERRQ(ierr);
844a13144ffSStefano Zampini 
845c2151214SStefano Zampini   if (fl2g) {
846c2151214SStefano Zampini     ierr = ISGlobalToLocalMappingApplyIS(fl2g,IS_GTOLM_DROP,allprimals,&primals);CHKERRQ(ierr);
847c2151214SStefano Zampini     ierr = PetscMalloc1(nee,&eedges);CHKERRQ(ierr);
848c2151214SStefano Zampini     for (i=0;i<nee;i++) {
849c2151214SStefano Zampini       ierr = ISGlobalToLocalMappingApplyIS(fl2g,IS_GTOLM_DROP,alleedges[i],&eedges[i]);CHKERRQ(ierr);
850c2151214SStefano Zampini     }
851c2151214SStefano Zampini   } else {
852c2151214SStefano Zampini     eedges  = alleedges;
853c2151214SStefano Zampini     primals = allprimals;
854c2151214SStefano Zampini   }
855c2151214SStefano Zampini 
856a13144ffSStefano Zampini   /* Mark fine edge dofs with their coarse edge id */
857a13144ffSStefano Zampini   ierr = PetscMemzero(marks,ne*sizeof(PetscInt));CHKERRQ(ierr);
858c2151214SStefano Zampini   ierr = ISGetLocalSize(primals,&cum);CHKERRQ(ierr);
859c2151214SStefano Zampini   ierr = ISGetIndices(primals,&idxs);CHKERRQ(ierr);
860c2151214SStefano Zampini   for (i=0;i<cum;i++) marks[idxs[i]] = nee+1;
861c2151214SStefano Zampini   ierr = ISRestoreIndices(primals,&idxs);CHKERRQ(ierr);
862c2151214SStefano Zampini   if (print) {
863c2151214SStefano Zampini     ierr = PetscObjectSetName((PetscObject)primals,"obtained_primal_dofs");CHKERRQ(ierr);
864c2151214SStefano Zampini     ierr = ISView(primals,NULL);CHKERRQ(ierr);
865c2151214SStefano Zampini   }
866c2151214SStefano Zampini 
867c2151214SStefano Zampini   maxsize = 0;
868a13144ffSStefano Zampini   for (i=0;i<nee;i++) {
869a13144ffSStefano Zampini     PetscInt size,mark = i+1;
870a13144ffSStefano Zampini 
871a13144ffSStefano Zampini     ierr = ISGetLocalSize(eedges[i],&size);CHKERRQ(ierr);
872a13144ffSStefano Zampini     ierr = ISGetIndices(eedges[i],&idxs);CHKERRQ(ierr);
873a13144ffSStefano Zampini     for (j=0;j<size;j++) marks[idxs[j]] = mark;
874a13144ffSStefano Zampini     ierr = ISRestoreIndices(eedges[i],&idxs);CHKERRQ(ierr);
875a13144ffSStefano Zampini     maxsize = PetscMax(maxsize,size);
876a13144ffSStefano Zampini   }
877a13144ffSStefano Zampini 
878a13144ffSStefano Zampini   /* Find coarse edge endpoints */
879a13144ffSStefano Zampini   ierr = MatGetRowIJ(lG,0,PETSC_FALSE,PETSC_FALSE,&i,&ii,&jj,&done);CHKERRQ(ierr);
880a13144ffSStefano Zampini   ierr = MatGetRowIJ(lGt,0,PETSC_FALSE,PETSC_FALSE,&i,&iit,&jjt,&done);CHKERRQ(ierr);
881a13144ffSStefano Zampini   for (i=0;i<nee;i++) {
882a13144ffSStefano Zampini     PetscInt mark = i+1,size;
883a13144ffSStefano Zampini 
884a13144ffSStefano Zampini     ierr = ISGetLocalSize(eedges[i],&size);CHKERRQ(ierr);
8851e0482f5SStefano Zampini     if (!size && nedfieldlocal) continue;
8861e0482f5SStefano Zampini     if (!size) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Unexpected zero sized edge %d",i);
887a13144ffSStefano Zampini     ierr = ISGetIndices(eedges[i],&idxs);CHKERRQ(ierr);
888a13144ffSStefano Zampini     if (print) {
889a13144ffSStefano Zampini       PetscPrintf(PETSC_COMM_SELF,"ENDPOINTS ANALYSIS EDGE %d\n",i);
890a13144ffSStefano Zampini       ISView(eedges[i],NULL);
891a13144ffSStefano Zampini     }
892a13144ffSStefano Zampini     for (j=0;j<size;j++) {
893a13144ffSStefano Zampini       PetscInt k, ee = idxs[j];
894a13144ffSStefano Zampini       if (print) PetscPrintf(PETSC_COMM_SELF,"  idx %d\n",ee);
895a13144ffSStefano Zampini       for (k=ii[ee];k<ii[ee+1];k++) {
896a13144ffSStefano Zampini         if (print) PetscPrintf(PETSC_COMM_SELF,"    inspect %d\n",jj[k]);
897a13144ffSStefano Zampini         if (PetscBTLookup(btv,jj[k])) {
898a13144ffSStefano Zampini           if (print) PetscPrintf(PETSC_COMM_SELF,"      corner found (already set) %d\n",jj[k]);
899a13144ffSStefano Zampini         } else if (PetscBTLookup(btvcand,jj[k])) { /* is it ok? */
900a13144ffSStefano Zampini           PetscInt  k2;
901a13144ffSStefano Zampini           PetscBool corner = PETSC_FALSE;
902a13144ffSStefano Zampini           for (k2 = iit[jj[k]];k2 < iit[jj[k]+1];k2++) {
903c2151214SStefano Zampini             if (print) PetscPrintf(PETSC_COMM_SELF,"        INSPECTING %d: mark %d (ref mark %d), boundary %d\n",jjt[k2],marks[jjt[k2]],mark,!!PetscBTLookup(btb,jjt[k2]));
904c2151214SStefano Zampini             /* it's a corner if it is either connected with an edge dof belonging to a different cc or
905c2151214SStefano Zampini                if the edge dof lies on the natural part of the boundary */
906c2151214SStefano Zampini             if ((marks[jjt[k2]] && marks[jjt[k2]] != mark) || (!marks[jjt[k2]] && PetscBTLookup(btb,jjt[k2]))) {
907a13144ffSStefano Zampini               corner = PETSC_TRUE;
908a13144ffSStefano Zampini               break;
909a13144ffSStefano Zampini             }
910a13144ffSStefano Zampini           }
911a13144ffSStefano Zampini           if (corner) { /* found the nodal dof corresponding to the endpoint of the edge */
912a13144ffSStefano Zampini             if (print) PetscPrintf(PETSC_COMM_SELF,"        corner found %d\n",jj[k]);
913a13144ffSStefano Zampini             ierr = PetscBTSet(btv,jj[k]);CHKERRQ(ierr);
914a13144ffSStefano Zampini           } else {
915a13144ffSStefano Zampini             if (print) PetscPrintf(PETSC_COMM_SELF,"        no corners found\n");
916a13144ffSStefano Zampini           }
917a13144ffSStefano Zampini         }
918a13144ffSStefano Zampini       }
919a13144ffSStefano Zampini     }
920a13144ffSStefano Zampini     ierr = ISRestoreIndices(eedges[i],&idxs);CHKERRQ(ierr);
921a13144ffSStefano Zampini   }
922a13144ffSStefano Zampini   ierr = MatRestoreRowIJ(lGt,0,PETSC_FALSE,PETSC_FALSE,&i,&iit,&jjt,&done);CHKERRQ(ierr);
923a13144ffSStefano Zampini   ierr = MatRestoreRowIJ(lG,0,PETSC_FALSE,PETSC_FALSE,&i,&ii,&jj,&done);CHKERRQ(ierr);
924c2151214SStefano Zampini   ierr = PetscBTDestroy(&btb);CHKERRQ(ierr);
925a13144ffSStefano Zampini 
926a13144ffSStefano Zampini   /* Reset marked primal dofs */
927a13144ffSStefano Zampini   ierr = ISGetLocalSize(primals,&cum);CHKERRQ(ierr);
928a13144ffSStefano Zampini   ierr = ISGetIndices(primals,&idxs);CHKERRQ(ierr);
929a13144ffSStefano Zampini   for (i=0;i<cum;i++) marks[idxs[i]] = 0;
930a13144ffSStefano Zampini   ierr = ISRestoreIndices(primals,&idxs);CHKERRQ(ierr);
931a13144ffSStefano Zampini 
9320569b399SStefano Zampini   /* Now use the initial lG */
9330569b399SStefano Zampini   ierr = MatDestroy(&lG);CHKERRQ(ierr);
9340569b399SStefano Zampini   ierr = MatDestroy(&lGt);CHKERRQ(ierr);
9350569b399SStefano Zampini   lG   = lGinit;
9360569b399SStefano Zampini   ierr = MatTranspose(lG,MAT_INITIAL_MATRIX,&lGt);CHKERRQ(ierr);
9370569b399SStefano Zampini 
938a13144ffSStefano Zampini   /* Compute extended cols indices */
939b03ebc13SStefano Zampini   ierr = PetscBTCreate(nv,&btvc);CHKERRQ(ierr);
940b03ebc13SStefano Zampini   ierr = PetscBTCreate(nee,&bter);CHKERRQ(ierr);
941a13144ffSStefano Zampini   ierr = MatGetRowIJ(lG,0,PETSC_FALSE,PETSC_FALSE,&i,&ii,&jj,&done);CHKERRQ(ierr);
942a13144ffSStefano Zampini   ierr = MatSeqAIJGetMaxRowNonzeros(lG,&i);CHKERRQ(ierr);
943a13144ffSStefano Zampini   i   *= maxsize;
944b03ebc13SStefano Zampini   ierr = PetscCalloc1(nee,&extcols);CHKERRQ(ierr);
945a13144ffSStefano Zampini   ierr = PetscMalloc2(i,&extrow,i,&gidxs);CHKERRQ(ierr);
946a13144ffSStefano Zampini   eerr = PETSC_FALSE;
947a13144ffSStefano Zampini   for (i=0;i<nee;i++) {
948b03ebc13SStefano Zampini     PetscInt size,found = 0;
949a13144ffSStefano Zampini 
950a13144ffSStefano Zampini     cum  = 0;
951a13144ffSStefano Zampini     ierr = ISGetLocalSize(eedges[i],&size);CHKERRQ(ierr);
9521e0482f5SStefano Zampini     if (!size && nedfieldlocal) continue;
9531e0482f5SStefano Zampini     if (!size) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Unexpected zero sized edge %d",i);
954a13144ffSStefano Zampini     ierr = ISGetIndices(eedges[i],&idxs);CHKERRQ(ierr);
955b03ebc13SStefano Zampini     ierr = PetscBTMemzero(nv,btvc);CHKERRQ(ierr);
956a13144ffSStefano Zampini     for (j=0;j<size;j++) {
957a13144ffSStefano Zampini       PetscInt k,ee = idxs[j];
958b03ebc13SStefano Zampini       for (k=ii[ee];k<ii[ee+1];k++) {
959b03ebc13SStefano Zampini         PetscInt vv = jj[k];
960b03ebc13SStefano Zampini         if (!PetscBTLookup(btv,vv)) extrow[cum++] = vv;
961b03ebc13SStefano Zampini         else if (!PetscBTLookupSet(btvc,vv)) found++;
962b03ebc13SStefano Zampini       }
963a13144ffSStefano Zampini     }
964a13144ffSStefano Zampini     ierr = ISRestoreIndices(eedges[i],&idxs);CHKERRQ(ierr);
965a13144ffSStefano Zampini     ierr = PetscSortRemoveDupsInt(&cum,extrow);CHKERRQ(ierr);
966a13144ffSStefano Zampini     ierr = ISLocalToGlobalMappingApply(vl2g,cum,extrow,gidxs);CHKERRQ(ierr);
967a13144ffSStefano Zampini     ierr = PetscSortIntWithArray(cum,gidxs,extrow);CHKERRQ(ierr);
968a13144ffSStefano Zampini     ierr = ISCreateGeneral(PETSC_COMM_SELF,cum,extrow,PETSC_COPY_VALUES,&extcols[i]);CHKERRQ(ierr);
969a13144ffSStefano Zampini     /* it may happen that endpoints are not defined at this point
970a13144ffSStefano Zampini        if it is the case, mark this edge for a second pass */
971b03ebc13SStefano Zampini     if (cum != size -1 || found != 2) {
972b03ebc13SStefano Zampini       ierr = PetscBTSet(bter,i);CHKERRQ(ierr);
973a13144ffSStefano Zampini       if (print) {
974a13144ffSStefano Zampini         ierr = PetscObjectSetName((PetscObject)eedges[i],"error_edge");CHKERRQ(ierr);
975a13144ffSStefano Zampini         ierr = ISView(eedges[i],NULL);CHKERRQ(ierr);
976a13144ffSStefano Zampini         ierr = PetscObjectSetName((PetscObject)extcols[i],"error_extcol");CHKERRQ(ierr);
977a13144ffSStefano Zampini         ierr = ISView(extcols[i],NULL);CHKERRQ(ierr);
978a13144ffSStefano Zampini       }
979a13144ffSStefano Zampini       eerr = PETSC_TRUE;
980a13144ffSStefano Zampini     }
981a13144ffSStefano Zampini   }
9824e64d54eSstefano_zampini   /* if (eerr) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Unexpected SIZE OF EDGE > EXTCOL FIRST PASS"); */
983a13144ffSStefano Zampini   ierr = MPIU_Allreduce(&eerr,&done,1,MPIU_BOOL,MPI_LOR,comm);CHKERRQ(ierr);
984a13144ffSStefano Zampini   if (done) {
985a13144ffSStefano Zampini     PetscInt *newprimals;
986a13144ffSStefano Zampini 
987a13144ffSStefano Zampini     ierr = PetscMalloc1(ne,&newprimals);CHKERRQ(ierr);
988a13144ffSStefano Zampini     ierr = ISGetLocalSize(primals,&cum);CHKERRQ(ierr);
989a13144ffSStefano Zampini     ierr = ISGetIndices(primals,&idxs);CHKERRQ(ierr);
990a13144ffSStefano Zampini     ierr = PetscMemcpy(newprimals,idxs,cum*sizeof(PetscInt));CHKERRQ(ierr);
991a13144ffSStefano Zampini     ierr = ISRestoreIndices(primals,&idxs);CHKERRQ(ierr);
9920569b399SStefano Zampini     ierr = MatGetRowIJ(lGt,0,PETSC_FALSE,PETSC_FALSE,&i,&iit,&jjt,&done);CHKERRQ(ierr);
993b03ebc13SStefano Zampini     if (print) PetscPrintf(PETSC_COMM_SELF,"DOING SECOND PASS (eerr %d)\n",eerr);
994a13144ffSStefano Zampini     for (i=0;i<nee;i++) {
995b03ebc13SStefano Zampini       PetscBool has_candidates = PETSC_FALSE;
996b03ebc13SStefano Zampini       if (PetscBTLookup(bter,i)) {
997a13144ffSStefano Zampini         PetscInt size,mark = i+1;
998a13144ffSStefano Zampini 
999a13144ffSStefano Zampini         ierr = ISGetLocalSize(eedges[i],&size);CHKERRQ(ierr);
1000a13144ffSStefano Zampini         ierr = ISGetIndices(eedges[i],&idxs);CHKERRQ(ierr);
1001c2151214SStefano Zampini         /* for (j=0;j<size;j++) newprimals[cum++] = idxs[j]; */
1002a13144ffSStefano Zampini         for (j=0;j<size;j++) {
1003a13144ffSStefano Zampini           PetscInt k,ee = idxs[j];
1004b03ebc13SStefano Zampini           if (print) PetscPrintf(PETSC_COMM_SELF,"Inspecting edge dof %d [%d %d)\n",ee,ii[ee],ii[ee+1]);
1005a13144ffSStefano Zampini           for (k=ii[ee];k<ii[ee+1];k++) {
1006a13144ffSStefano Zampini             /* set all candidates located on the edge as corners */
1007a13144ffSStefano Zampini             if (PetscBTLookup(btvcand,jj[k])) {
1008a13144ffSStefano Zampini               PetscInt k2,vv = jj[k];
1009b03ebc13SStefano Zampini               has_candidates = PETSC_TRUE;
1010b03ebc13SStefano Zampini               if (print) PetscPrintf(PETSC_COMM_SELF,"  Candidate set to vertex %d\n",vv);
1011a13144ffSStefano Zampini               ierr = PetscBTSet(btv,vv);CHKERRQ(ierr);
1012a13144ffSStefano Zampini               /* set all edge dofs connected to candidate as primals */
1013a13144ffSStefano Zampini               for (k2=iit[vv];k2<iit[vv+1];k2++) {
1014a13144ffSStefano Zampini                 if (marks[jjt[k2]] == mark) {
1015a13144ffSStefano Zampini                   PetscInt k3,ee2 = jjt[k2];
1016b03ebc13SStefano Zampini                   if (print) PetscPrintf(PETSC_COMM_SELF,"    Connected edge dof set to primal %d\n",ee2);
1017a13144ffSStefano Zampini                   newprimals[cum++] = ee2;
1018a13144ffSStefano Zampini                   /* finally set the new corners */
1019a13144ffSStefano Zampini                   for (k3=ii[ee2];k3<ii[ee2+1];k3++) {
1020b03ebc13SStefano Zampini                     if (print) PetscPrintf(PETSC_COMM_SELF,"      Connected nodal dof set to vertex %d\n",jj[k3]);
1021a13144ffSStefano Zampini                     ierr = PetscBTSet(btv,jj[k3]);CHKERRQ(ierr);
1022a13144ffSStefano Zampini                   }
1023a13144ffSStefano Zampini                 }
1024a13144ffSStefano Zampini               }
1025b03ebc13SStefano Zampini             } else {
1026b03ebc13SStefano Zampini               if (print) PetscPrintf(PETSC_COMM_SELF,"  Not a candidate vertex %d\n",jj[k]);
1027a13144ffSStefano Zampini             }
1028a13144ffSStefano Zampini           }
1029a13144ffSStefano Zampini         }
1030b03ebc13SStefano Zampini         if (!has_candidates) { /* circular edge */
1031b03ebc13SStefano Zampini           PetscInt k, ee = idxs[0],*tmarks;
1032b03ebc13SStefano Zampini 
1033b03ebc13SStefano Zampini           ierr = PetscCalloc1(ne,&tmarks);CHKERRQ(ierr);
1034b03ebc13SStefano Zampini           if (print) PetscPrintf(PETSC_COMM_SELF,"  Circular edge %d\n",i);
1035b03ebc13SStefano Zampini           for (k=ii[ee];k<ii[ee+1];k++) {
1036b03ebc13SStefano Zampini             PetscInt k2;
1037b03ebc13SStefano Zampini             if (print) PetscPrintf(PETSC_COMM_SELF,"    Set to corner %d\n",jj[k]);
1038b03ebc13SStefano Zampini             ierr = PetscBTSet(btv,jj[k]);CHKERRQ(ierr);
1039b03ebc13SStefano Zampini             for (k2=iit[jj[k]];k2<iit[jj[k]+1];k2++) tmarks[jjt[k2]]++;
1040b03ebc13SStefano Zampini           }
1041b03ebc13SStefano Zampini           for (j=0;j<size;j++) {
1042b03ebc13SStefano Zampini             if (tmarks[idxs[j]] > 1) {
1043b03ebc13SStefano Zampini               if (print) PetscPrintf(PETSC_COMM_SELF,"  Edge dof set to primal %d\n",idxs[j]);
1044b03ebc13SStefano Zampini               newprimals[cum++] = idxs[j];
1045b03ebc13SStefano Zampini             }
1046b03ebc13SStefano Zampini           }
1047b03ebc13SStefano Zampini           ierr = PetscFree(tmarks);CHKERRQ(ierr);
1048b03ebc13SStefano Zampini         }
1049a13144ffSStefano Zampini         ierr = ISRestoreIndices(eedges[i],&idxs);CHKERRQ(ierr);
1050a13144ffSStefano Zampini       }
1051a13144ffSStefano Zampini       ierr = ISDestroy(&extcols[i]);CHKERRQ(ierr);
1052a13144ffSStefano Zampini     }
1053b03ebc13SStefano Zampini     ierr = PetscFree(extcols);CHKERRQ(ierr);
10540569b399SStefano Zampini     ierr = MatRestoreRowIJ(lGt,0,PETSC_FALSE,PETSC_FALSE,&i,&iit,&jjt,&done);CHKERRQ(ierr);
1055a13144ffSStefano Zampini     ierr = PetscSortRemoveDupsInt(&cum,newprimals);CHKERRQ(ierr);
1056c2151214SStefano Zampini     if (fl2g) {
1057c2151214SStefano Zampini       ierr = ISLocalToGlobalMappingApply(fl2g,cum,newprimals,newprimals);CHKERRQ(ierr);
1058c2151214SStefano Zampini       ierr = ISDestroy(&primals);CHKERRQ(ierr);
1059c2151214SStefano Zampini       for (i=0;i<nee;i++) {
1060c2151214SStefano Zampini         ierr = ISDestroy(&eedges[i]);CHKERRQ(ierr);
1061c2151214SStefano Zampini       }
1062c2151214SStefano Zampini       ierr = PetscFree(eedges);CHKERRQ(ierr);
1063c2151214SStefano Zampini     }
1064c2151214SStefano Zampini     ierr = PCBDDCGraphRestoreCandidatesIS(pcbddc->mat_graph,NULL,NULL,&nee,&alleedges,&allprimals);CHKERRQ(ierr);
1065a13144ffSStefano Zampini     ierr = ISCreateGeneral(comm,cum,newprimals,PETSC_COPY_VALUES,&primals);CHKERRQ(ierr);
1066a13144ffSStefano Zampini     ierr = PetscFree(newprimals);CHKERRQ(ierr);
1067a13144ffSStefano Zampini     ierr = PCBDDCSetPrimalVerticesLocalIS(pc,primals);CHKERRQ(ierr);
1068a13144ffSStefano Zampini     ierr = ISDestroy(&primals);CHKERRQ(ierr);
1069a13144ffSStefano Zampini     ierr = PCBDDCAnalyzeInterface(pc);CHKERRQ(ierr);
1070213b8bfaSStefano Zampini     pcbddc->mat_graph->twodim = PETSC_FALSE;
1071c2151214SStefano Zampini     ierr = PCBDDCGraphGetCandidatesIS(pcbddc->mat_graph,NULL,NULL,&nee,&alleedges,&allprimals);CHKERRQ(ierr);
1072c2151214SStefano Zampini     if (fl2g) {
1073c2151214SStefano Zampini       ierr = ISGlobalToLocalMappingApplyIS(fl2g,IS_GTOLM_DROP,allprimals,&primals);CHKERRQ(ierr);
1074c2151214SStefano Zampini       ierr = PetscMalloc1(nee,&eedges);CHKERRQ(ierr);
1075c2151214SStefano Zampini       for (i=0;i<nee;i++) {
1076c2151214SStefano Zampini         ierr = ISGlobalToLocalMappingApplyIS(fl2g,IS_GTOLM_DROP,alleedges[i],&eedges[i]);CHKERRQ(ierr);
1077c2151214SStefano Zampini       }
1078c2151214SStefano Zampini     } else {
1079c2151214SStefano Zampini       eedges  = alleedges;
1080c2151214SStefano Zampini       primals = allprimals;
1081c2151214SStefano Zampini     }
1082b03ebc13SStefano Zampini     ierr = PetscCalloc1(nee,&extcols);CHKERRQ(ierr);
1083a13144ffSStefano Zampini 
1084a13144ffSStefano Zampini     /* Mark again */
1085a13144ffSStefano Zampini     ierr = PetscMemzero(marks,ne*sizeof(PetscInt));CHKERRQ(ierr);
1086a13144ffSStefano Zampini     for (i=0;i<nee;i++) {
1087a13144ffSStefano Zampini       PetscInt size,mark = i+1;
1088a13144ffSStefano Zampini 
1089a13144ffSStefano Zampini       ierr = ISGetLocalSize(eedges[i],&size);CHKERRQ(ierr);
1090a13144ffSStefano Zampini       ierr = ISGetIndices(eedges[i],&idxs);CHKERRQ(ierr);
1091a13144ffSStefano Zampini       for (j=0;j<size;j++) marks[idxs[j]] = mark;
1092a13144ffSStefano Zampini       ierr = ISRestoreIndices(eedges[i],&idxs);CHKERRQ(ierr);
1093a13144ffSStefano Zampini     }
1094a13144ffSStefano Zampini     if (print) {
1095a13144ffSStefano Zampini       ierr = PetscObjectSetName((PetscObject)primals,"obtained_primal_dofs_secondpass");CHKERRQ(ierr);
1096a13144ffSStefano Zampini       ierr = ISView(primals,NULL);CHKERRQ(ierr);
1097a13144ffSStefano Zampini     }
1098a13144ffSStefano Zampini 
1099a13144ffSStefano Zampini     /* Recompute extended cols */
1100a13144ffSStefano Zampini     eerr = PETSC_FALSE;
1101a13144ffSStefano Zampini     for (i=0;i<nee;i++) {
1102a13144ffSStefano Zampini       PetscInt size;
1103a13144ffSStefano Zampini 
1104a13144ffSStefano Zampini       cum  = 0;
1105a13144ffSStefano Zampini       ierr = ISGetLocalSize(eedges[i],&size);CHKERRQ(ierr);
11061e0482f5SStefano Zampini       if (!size && nedfieldlocal) continue;
11071e0482f5SStefano Zampini       if (!size) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Unexpected zero sized edge %d",i);
1108a13144ffSStefano Zampini       ierr = ISGetIndices(eedges[i],&idxs);CHKERRQ(ierr);
1109a13144ffSStefano Zampini       for (j=0;j<size;j++) {
1110a13144ffSStefano Zampini         PetscInt k,ee = idxs[j];
11111e0482f5SStefano Zampini         for (k=ii[ee];k<ii[ee+1];k++) if (!PetscBTLookup(btv,jj[k])) extrow[cum++] = jj[k];
1112a13144ffSStefano Zampini       }
1113a13144ffSStefano Zampini       ierr = ISRestoreIndices(eedges[i],&idxs);CHKERRQ(ierr);
1114a13144ffSStefano Zampini       ierr = PetscSortRemoveDupsInt(&cum,extrow);CHKERRQ(ierr);
1115a13144ffSStefano Zampini       ierr = ISLocalToGlobalMappingApply(vl2g,cum,extrow,gidxs);CHKERRQ(ierr);
1116a13144ffSStefano Zampini       ierr = PetscSortIntWithArray(cum,gidxs,extrow);CHKERRQ(ierr);
1117a13144ffSStefano Zampini       ierr = ISCreateGeneral(PETSC_COMM_SELF,cum,extrow,PETSC_COPY_VALUES,&extcols[i]);CHKERRQ(ierr);
1118a13144ffSStefano Zampini       if (cum != size -1) {
1119a13144ffSStefano Zampini         if (print) {
1120a13144ffSStefano Zampini           ierr = PetscObjectSetName((PetscObject)eedges[i],"error_edge_secondpass");CHKERRQ(ierr);
1121a13144ffSStefano Zampini           ierr = ISView(eedges[i],NULL);CHKERRQ(ierr);
1122a13144ffSStefano Zampini           ierr = PetscObjectSetName((PetscObject)extcols[i],"error_extcol_secondpass");CHKERRQ(ierr);
1123a13144ffSStefano Zampini           ierr = ISView(extcols[i],NULL);CHKERRQ(ierr);
1124a13144ffSStefano Zampini         }
1125a13144ffSStefano Zampini         eerr = PETSC_TRUE;
1126a13144ffSStefano Zampini       }
1127a13144ffSStefano Zampini     }
1128a13144ffSStefano Zampini   }
1129a13144ffSStefano Zampini   ierr = MatRestoreRowIJ(lG,0,PETSC_FALSE,PETSC_FALSE,&i,&ii,&jj,&done);CHKERRQ(ierr);
1130a13144ffSStefano Zampini   ierr = PetscFree2(extrow,gidxs);CHKERRQ(ierr);
1131b03ebc13SStefano Zampini   ierr = PetscBTDestroy(&bter);CHKERRQ(ierr);
11327d871cd7SStefano Zampini   if (print) { ierr = PCBDDCGraphASCIIView(pcbddc->mat_graph,5,PETSC_VIEWER_STDOUT_SELF);CHKERRQ(ierr); }
1133a13144ffSStefano Zampini   /* an error should not occur at this point */
1134a13144ffSStefano Zampini   if (eerr) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Unexpected SIZE OF EDGE > EXTCOL SECOND PASS");
1135a13144ffSStefano Zampini 
11364e64d54eSstefano_zampini   /* Check the number of endpoints */
11370569b399SStefano Zampini   ierr = MatGetRowIJ(lG,0,PETSC_FALSE,PETSC_FALSE,&i,&ii,&jj,&done);CHKERRQ(ierr);
1138b03ebc13SStefano Zampini   ierr = PetscMalloc1(2*nee,&corners);CHKERRQ(ierr);
1139b03ebc13SStefano Zampini   ierr = PetscMalloc1(nee,&cedges);CHKERRQ(ierr);
11404e64d54eSstefano_zampini   for (i=0;i<nee;i++) {
1141b03ebc13SStefano Zampini     PetscInt size, found = 0, gc[2];
11424e64d54eSstefano_zampini 
1143b03ebc13SStefano Zampini     /* init with defaults */
1144b03ebc13SStefano Zampini     cedges[i] = corners[i*2] = corners[i*2+1] = -1;
11454e64d54eSstefano_zampini     ierr = ISGetLocalSize(eedges[i],&size);CHKERRQ(ierr);
11461e0482f5SStefano Zampini     if (!size && nedfieldlocal) continue;
11471e0482f5SStefano Zampini     if (!size) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Unexpected zero sized edge %d",i);
11484e64d54eSstefano_zampini     ierr = ISGetIndices(eedges[i],&idxs);CHKERRQ(ierr);
1149b03ebc13SStefano Zampini     ierr = PetscBTMemzero(nv,btvc);CHKERRQ(ierr);
11504e64d54eSstefano_zampini     for (j=0;j<size;j++) {
11514e64d54eSstefano_zampini       PetscInt k,ee = idxs[j];
11524e64d54eSstefano_zampini       for (k=ii[ee];k<ii[ee+1];k++) {
11534e64d54eSstefano_zampini         PetscInt vv = jj[k];
11544e64d54eSstefano_zampini         if (PetscBTLookup(btv,vv) && !PetscBTLookupSet(btvc,vv)) {
1155b03ebc13SStefano Zampini           if (found == 2) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Found more then two corners for edge %d\n",i);
1156b03ebc13SStefano Zampini           corners[i*2+found++] = vv;
11574e64d54eSstefano_zampini         }
11584e64d54eSstefano_zampini       }
11594e64d54eSstefano_zampini     }
1160b03ebc13SStefano Zampini     if (found != 2) {
1161b03ebc13SStefano Zampini       PetscInt e;
1162b03ebc13SStefano Zampini       if (fl2g) {
1163b03ebc13SStefano Zampini         ierr = ISLocalToGlobalMappingApply(fl2g,1,idxs,&e);CHKERRQ(ierr);
1164b03ebc13SStefano Zampini       } else {
1165b03ebc13SStefano Zampini         e = idxs[0];
1166b03ebc13SStefano Zampini       }
1167b03ebc13SStefano Zampini       SETERRQ4(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Found %d corners for edge %d (astart %d, estart %d)\n",found,i,e,idxs[0]);
1168b03ebc13SStefano Zampini     }
1169eee23b56SStefano Zampini 
1170eee23b56SStefano Zampini     /* get primal dof index on this coarse edge */
1171b03ebc13SStefano Zampini     ierr = ISLocalToGlobalMappingApply(vl2g,2,corners+2*i,gc);CHKERRQ(ierr);
1172b03ebc13SStefano Zampini     if (gc[0] > gc[1]) {
1173b03ebc13SStefano Zampini       PetscInt swap  = corners[2*i];
1174b03ebc13SStefano Zampini       corners[2*i]   = corners[2*i+1];
1175b03ebc13SStefano Zampini       corners[2*i+1] = swap;
1176b03ebc13SStefano Zampini     }
1177eee23b56SStefano Zampini     cedges[i] = idxs[size-1];
11784e64d54eSstefano_zampini     ierr = ISRestoreIndices(eedges[i],&idxs);CHKERRQ(ierr);
1179b03ebc13SStefano Zampini     if (print) PetscPrintf(PETSC_COMM_SELF,"EDGE %d: ce %d, corners (%d,%d)\n",i,cedges[i],corners[2*i],corners[2*i+1]);
11804e64d54eSstefano_zampini   }
11810569b399SStefano Zampini   ierr = MatRestoreRowIJ(lG,0,PETSC_FALSE,PETSC_FALSE,&i,&ii,&jj,&done);CHKERRQ(ierr);
11824e64d54eSstefano_zampini   ierr = PetscBTDestroy(&btvc);CHKERRQ(ierr);
11834e64d54eSstefano_zampini 
1184a13144ffSStefano Zampini #if defined(PETSC_USE_DEBUG)
1185a13144ffSStefano Zampini   /* Inspects columns of lG (rows of lGt) and make sure the change of basis will
1186a13144ffSStefano Zampini      not interfere with neighbouring coarse edges */
1187a13144ffSStefano Zampini   ierr = PetscMalloc1(nee+1,&emarks);CHKERRQ(ierr);
1188a13144ffSStefano Zampini   ierr = MatGetRowIJ(lGt,0,PETSC_FALSE,PETSC_FALSE,&i,&ii,&jj,&done);CHKERRQ(ierr);
1189a13144ffSStefano Zampini   for (i=0;i<nv;i++) {
1190a13144ffSStefano Zampini     PetscInt emax = 0,eemax = 0;
1191a13144ffSStefano Zampini 
1192a13144ffSStefano Zampini     if (ii[i+1]==ii[i] || PetscBTLookup(btv,i)) continue;
1193a13144ffSStefano Zampini     ierr = PetscMemzero(emarks,(nee+1)*sizeof(PetscInt));CHKERRQ(ierr);
1194a13144ffSStefano Zampini     for (j=ii[i];j<ii[i+1];j++) emarks[marks[jj[j]]]++;
1195a13144ffSStefano Zampini     for (j=1;j<nee+1;j++) {
1196a13144ffSStefano Zampini       if (emax < emarks[j]) {
1197a13144ffSStefano Zampini         emax = emarks[j];
1198a13144ffSStefano Zampini         eemax = j;
1199a13144ffSStefano Zampini       }
1200a13144ffSStefano Zampini     }
1201a13144ffSStefano Zampini     /* not relevant for edges */
1202a13144ffSStefano Zampini     if (!eemax) continue;
1203a13144ffSStefano Zampini 
1204a13144ffSStefano Zampini     for (j=ii[i];j<ii[i+1];j++) {
1205a13144ffSStefano Zampini       if (marks[jj[j]] && marks[jj[j]] != eemax) {
1206c2151214SStefano Zampini         SETERRQ4(PETSC_COMM_SELF,PETSC_ERR_SUP,"Found 2 coarse edges (id %d and %d) connected through the %d nodal dof at edge dof %d\n",marks[jj[j]]-1,eemax,i,jj[j]);
1207a13144ffSStefano Zampini       }
1208a13144ffSStefano Zampini     }
1209a13144ffSStefano Zampini   }
1210a13144ffSStefano Zampini   ierr = PetscFree(emarks);CHKERRQ(ierr);
1211a13144ffSStefano Zampini   ierr = MatRestoreRowIJ(lGt,0,PETSC_FALSE,PETSC_FALSE,&i,&ii,&jj,&done);CHKERRQ(ierr);
1212a13144ffSStefano Zampini #endif
1213a13144ffSStefano Zampini 
1214a13144ffSStefano Zampini   /* Compute extended rows indices for edge blocks of the change of basis */
1215a13144ffSStefano Zampini   ierr = MatGetRowIJ(lGt,0,PETSC_FALSE,PETSC_FALSE,&i,&ii,&jj,&done);CHKERRQ(ierr);
1216a13144ffSStefano Zampini   ierr = MatSeqAIJGetMaxRowNonzeros(lGt,&extmem);CHKERRQ(ierr);
1217a13144ffSStefano Zampini   extmem *= maxsize;
1218a13144ffSStefano Zampini   ierr = PetscMalloc1(extmem*nee,&extrow);CHKERRQ(ierr);
1219a13144ffSStefano Zampini   ierr = PetscMalloc1(nee,&extrows);CHKERRQ(ierr);
1220a13144ffSStefano Zampini   ierr = PetscCalloc1(nee,&extrowcum);CHKERRQ(ierr);
1221a13144ffSStefano Zampini   for (i=0;i<nv;i++) {
1222a13144ffSStefano Zampini     PetscInt mark = 0,size,start;
1223213b8bfaSStefano Zampini 
1224a13144ffSStefano Zampini     if (ii[i+1]==ii[i] || PetscBTLookup(btv,i)) continue;
1225a13144ffSStefano Zampini     for (j=ii[i];j<ii[i+1];j++)
1226a13144ffSStefano Zampini       if (marks[jj[j]] && !mark)
1227a13144ffSStefano Zampini         mark = marks[jj[j]];
1228a13144ffSStefano Zampini 
1229a13144ffSStefano Zampini     /* not relevant */
1230a13144ffSStefano Zampini     if (!mark) continue;
1231a13144ffSStefano Zampini 
1232a13144ffSStefano Zampini     /* import extended row */
1233a13144ffSStefano Zampini     mark--;
1234a13144ffSStefano Zampini     start = mark*extmem+extrowcum[mark];
1235a13144ffSStefano Zampini     size = ii[i+1]-ii[i];
1236a13144ffSStefano Zampini     if (extrowcum[mark] + size > extmem) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Not enough memory allocated %d > %d",extrowcum[mark] + size,extmem);
1237a13144ffSStefano Zampini     ierr = PetscMemcpy(extrow+start,jj+ii[i],size*sizeof(PetscInt));CHKERRQ(ierr);
1238a13144ffSStefano Zampini     extrowcum[mark] += size;
1239a13144ffSStefano Zampini   }
1240a13144ffSStefano Zampini   ierr = MatRestoreRowIJ(lGt,0,PETSC_FALSE,PETSC_FALSE,&i,&ii,&jj,&done);CHKERRQ(ierr);
1241213b8bfaSStefano Zampini   ierr = MatDestroy(&lGt);CHKERRQ(ierr);
1242213b8bfaSStefano Zampini   ierr = PetscFree(marks);CHKERRQ(ierr);
1243213b8bfaSStefano Zampini 
1244213b8bfaSStefano Zampini   /* Compress extrows */
1245a13144ffSStefano Zampini   cum  = 0;
1246a13144ffSStefano Zampini   for (i=0;i<nee;i++) {
1247a13144ffSStefano Zampini     PetscInt size = extrowcum[i],*start = extrow + i*extmem;
1248a13144ffSStefano Zampini     ierr = PetscSortRemoveDupsInt(&size,start);CHKERRQ(ierr);
1249a13144ffSStefano Zampini     ierr = ISCreateGeneral(PETSC_COMM_SELF,size,start,PETSC_USE_POINTER,&extrows[i]);CHKERRQ(ierr);
1250a13144ffSStefano Zampini     cum  = PetscMax(cum,size);
1251a13144ffSStefano Zampini   }
1252a13144ffSStefano Zampini   ierr = PetscFree(extrowcum);CHKERRQ(ierr);
1253a13144ffSStefano Zampini   ierr = PetscBTDestroy(&btv);CHKERRQ(ierr);
1254a13144ffSStefano Zampini   ierr = PetscBTDestroy(&btvcand);CHKERRQ(ierr);
1255a13144ffSStefano Zampini 
1256a13144ffSStefano Zampini   /* Workspace for lapack inner calls and VecSetValues */
1257a13144ffSStefano Zampini   ierr = PetscMalloc2((5+cum+maxsize)*maxsize,&work,maxsize,&rwork);CHKERRQ(ierr);
1258a13144ffSStefano Zampini 
1259a13144ffSStefano Zampini   /* Create change of basis matrix (preallocation can be improved) */
1260a13144ffSStefano Zampini   ierr = MatCreate(comm,&T);CHKERRQ(ierr);
1261c2151214SStefano Zampini   ierr = MatSetSizes(T,pc->pmat->rmap->n,pc->pmat->rmap->n,
1262c2151214SStefano Zampini                        pc->pmat->rmap->N,pc->pmat->rmap->N);CHKERRQ(ierr);
1263a13144ffSStefano Zampini   ierr = MatSetType(T,MATAIJ);CHKERRQ(ierr);
1264a13144ffSStefano Zampini   ierr = MatSeqAIJSetPreallocation(T,10,NULL);CHKERRQ(ierr);
1265a13144ffSStefano Zampini   ierr = MatMPIAIJSetPreallocation(T,10,NULL,10,NULL);CHKERRQ(ierr);
12661e0482f5SStefano Zampini   ierr = MatSetLocalToGlobalMapping(T,al2g,al2g);CHKERRQ(ierr);
1267a13144ffSStefano Zampini   ierr = MatSetOption(T,MAT_NEW_NONZERO_ALLOCATION_ERR,PETSC_FALSE);CHKERRQ(ierr);
1268a13144ffSStefano Zampini   ierr = MatSetOption(T,MAT_ROW_ORIENTED,PETSC_FALSE);CHKERRQ(ierr);
1269213b8bfaSStefano Zampini   ierr = ISLocalToGlobalMappingDestroy(&al2g);CHKERRQ(ierr);
1270a13144ffSStefano Zampini 
1271a13144ffSStefano Zampini   /* Defaults to identity */
1272c2151214SStefano Zampini   ierr = MatCreateVecs(pc->pmat,&tvec,NULL);CHKERRQ(ierr);
1273a13144ffSStefano Zampini   ierr = VecSet(tvec,1.0);CHKERRQ(ierr);
1274a13144ffSStefano Zampini   ierr = MatDiagonalSet(T,tvec,INSERT_VALUES);CHKERRQ(ierr);
1275a13144ffSStefano Zampini   ierr = VecDestroy(&tvec);CHKERRQ(ierr);
1276a13144ffSStefano Zampini 
12771e0482f5SStefano Zampini   /* Create discrete gradient for the coarser level if needed */
12781e0482f5SStefano Zampini   ierr = MatDestroy(&pcbddc->nedcG);CHKERRQ(ierr);
12791e0482f5SStefano Zampini   ierr = ISDestroy(&pcbddc->nedclocal);CHKERRQ(ierr);
12801e0482f5SStefano Zampini   if (pcbddc->current_level < pcbddc->max_levels) {
12811e0482f5SStefano Zampini     ISLocalToGlobalMapping cel2g,cvl2g;
12821e0482f5SStefano Zampini     IS                     wis,gwis;
12831e0482f5SStefano Zampini     PetscInt               cnv,cne;
12841e0482f5SStefano Zampini 
12851e0482f5SStefano Zampini     ierr = ISCreateGeneral(comm,nee,cedges,PETSC_COPY_VALUES,&wis);CHKERRQ(ierr);
12861e0482f5SStefano Zampini     if (fl2g) {
12871e0482f5SStefano Zampini       ierr = ISLocalToGlobalMappingApplyIS(fl2g,wis,&pcbddc->nedclocal);CHKERRQ(ierr);
12881e0482f5SStefano Zampini     } else {
12891e0482f5SStefano Zampini       ierr = PetscObjectReference((PetscObject)wis);CHKERRQ(ierr);
12901e0482f5SStefano Zampini       pcbddc->nedclocal = wis;
12911e0482f5SStefano Zampini     }
12921e0482f5SStefano Zampini     ierr = ISLocalToGlobalMappingApplyIS(el2g,wis,&gwis);CHKERRQ(ierr);
12931e0482f5SStefano Zampini     ierr = ISDestroy(&wis);CHKERRQ(ierr);
12941e0482f5SStefano Zampini     ierr = ISRenumber(gwis,NULL,&cne,&wis);CHKERRQ(ierr);
12951e0482f5SStefano Zampini     ierr = ISLocalToGlobalMappingCreateIS(wis,&cel2g);CHKERRQ(ierr);
12961e0482f5SStefano Zampini     ierr = ISDestroy(&wis);CHKERRQ(ierr);
12971e0482f5SStefano Zampini     ierr = ISDestroy(&gwis);CHKERRQ(ierr);
12981e0482f5SStefano Zampini 
12991e0482f5SStefano Zampini     ierr = ISCreateGeneral(comm,2*nee,corners,PETSC_USE_POINTER,&wis);CHKERRQ(ierr);
13001e0482f5SStefano Zampini     ierr = ISLocalToGlobalMappingApplyIS(vl2g,wis,&gwis);CHKERRQ(ierr);
13011e0482f5SStefano Zampini     ierr = ISDestroy(&wis);CHKERRQ(ierr);
13021e0482f5SStefano Zampini     ierr = ISRenumber(gwis,NULL,&cnv,&wis);CHKERRQ(ierr);
13031e0482f5SStefano Zampini     ierr = ISLocalToGlobalMappingCreateIS(wis,&cvl2g);CHKERRQ(ierr);
13041e0482f5SStefano Zampini     ierr = ISDestroy(&wis);CHKERRQ(ierr);
13051e0482f5SStefano Zampini     ierr = ISDestroy(&gwis);CHKERRQ(ierr);
13061e0482f5SStefano Zampini 
13071e0482f5SStefano Zampini     ierr = MatCreate(comm,&pcbddc->nedcG);CHKERRQ(ierr);
13081e0482f5SStefano Zampini     ierr = MatSetSizes(pcbddc->nedcG,PETSC_DECIDE,PETSC_DECIDE,cne,cnv);CHKERRQ(ierr);
13091e0482f5SStefano Zampini     ierr = MatSetType(pcbddc->nedcG,MATAIJ);CHKERRQ(ierr);
13101e0482f5SStefano Zampini     ierr = MatSeqAIJSetPreallocation(pcbddc->nedcG,2,NULL);CHKERRQ(ierr);
13111e0482f5SStefano Zampini     ierr = MatMPIAIJSetPreallocation(pcbddc->nedcG,2,NULL,2,NULL);CHKERRQ(ierr);
13121e0482f5SStefano Zampini     ierr = MatSetLocalToGlobalMapping(pcbddc->nedcG,cel2g,cvl2g);CHKERRQ(ierr);
13131e0482f5SStefano Zampini     ierr = ISLocalToGlobalMappingDestroy(&cel2g);CHKERRQ(ierr);
13141e0482f5SStefano Zampini     ierr = ISLocalToGlobalMappingDestroy(&cvl2g);CHKERRQ(ierr);
13151e0482f5SStefano Zampini   }
1316213b8bfaSStefano Zampini   ierr = ISLocalToGlobalMappingDestroy(&vl2g);CHKERRQ(ierr);
13171e0482f5SStefano Zampini 
13181e0482f5SStefano Zampini #if defined(PRINT_GDET)
13191e0482f5SStefano Zampini   inc = 0;
13201e0482f5SStefano Zampini   lev = pcbddc->current_level;
13211e0482f5SStefano Zampini #endif
1322213b8bfaSStefano Zampini 
1323213b8bfaSStefano Zampini   /* Insert values in the change of basis matrix */
1324a13144ffSStefano Zampini   for (i=0;i<nee;i++) {
1325a13144ffSStefano Zampini     Mat         Gins = NULL, GKins = NULL;
13261e0482f5SStefano Zampini     IS          cornersis = NULL;
13271e0482f5SStefano Zampini     PetscScalar cvals[2];
1328a13144ffSStefano Zampini 
13291e0482f5SStefano Zampini     if (pcbddc->nedcG) {
13301e0482f5SStefano Zampini       ierr = ISCreateGeneral(PETSC_COMM_SELF,2,corners+2*i,PETSC_USE_POINTER,&cornersis);CHKERRQ(ierr);
13311e0482f5SStefano Zampini     }
13321e0482f5SStefano Zampini     ierr = PCBDDCComputeNedelecChangeEdge(lG,eedges[i],extrows[i],extcols[i],cornersis,&Gins,&GKins,cvals,work,rwork);CHKERRQ(ierr);
1333a13144ffSStefano Zampini     if (Gins && GKins) {
1334a13144ffSStefano Zampini       PetscScalar    *data;
1335a13144ffSStefano Zampini       const PetscInt *rows,*cols;
1336a13144ffSStefano Zampini       PetscInt       nrh,nch,nrc,ncc;
1337a13144ffSStefano Zampini 
1338a13144ffSStefano Zampini       ierr = ISGetIndices(eedges[i],&cols);CHKERRQ(ierr);
1339a13144ffSStefano Zampini       /* H1 */
1340a13144ffSStefano Zampini       ierr = ISGetIndices(extrows[i],&rows);CHKERRQ(ierr);
1341a13144ffSStefano Zampini       ierr = MatGetSize(Gins,&nrh,&nch);CHKERRQ(ierr);
1342a13144ffSStefano Zampini       ierr = MatDenseGetArray(Gins,&data);CHKERRQ(ierr);
1343a13144ffSStefano Zampini       ierr = MatSetValuesLocal(T,nrh,rows,nch,cols,data,INSERT_VALUES);CHKERRQ(ierr);
1344a13144ffSStefano Zampini       ierr = MatDenseRestoreArray(Gins,&data);CHKERRQ(ierr);
1345a13144ffSStefano Zampini       ierr = ISRestoreIndices(extrows[i],&rows);CHKERRQ(ierr);
1346a13144ffSStefano Zampini       /* complement */
1347a13144ffSStefano Zampini       ierr = MatGetSize(GKins,&nrc,&ncc);CHKERRQ(ierr);
13481e0482f5SStefano Zampini       if (!ncc) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Constant function has not been generated for coarse edge %d",i);
1349213b8bfaSStefano Zampini       if (ncc + nch != nrc) SETERRQ4(PETSC_COMM_SELF,PETSC_ERR_PLIB,"The sum of the number of columns of GKins %d and Gins %d does not match %d for coarse edge %d",ncc,nch,nrc,i);
1350213b8bfaSStefano Zampini       if (ncc != 1 && pcbddc->nedcG) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_SUP,"Cannot generate the coarse discrete gradient for coarse edge %d with ncc %d",i,ncc);
1351a13144ffSStefano Zampini       ierr = MatDenseGetArray(GKins,&data);CHKERRQ(ierr);
1352a13144ffSStefano Zampini       ierr = MatSetValuesLocal(T,nrc,cols,ncc,cols+nch,data,INSERT_VALUES);CHKERRQ(ierr);
1353a13144ffSStefano Zampini       ierr = MatDenseRestoreArray(GKins,&data);CHKERRQ(ierr);
13541e0482f5SStefano Zampini 
13551e0482f5SStefano Zampini       /* coarse discrete gradient */
13561e0482f5SStefano Zampini       if (pcbddc->nedcG) {
13571e0482f5SStefano Zampini         PetscInt cols[2];
13581e0482f5SStefano Zampini 
13591e0482f5SStefano Zampini         cols[0] = 2*i;
13601e0482f5SStefano Zampini         cols[1] = 2*i+1;
13611e0482f5SStefano Zampini         ierr = MatSetValuesLocal(pcbddc->nedcG,1,&i,2,cols,cvals,INSERT_VALUES);CHKERRQ(ierr);
13621e0482f5SStefano Zampini       }
1363a13144ffSStefano Zampini       ierr = ISRestoreIndices(eedges[i],&cols);CHKERRQ(ierr);
1364a13144ffSStefano Zampini     }
1365a13144ffSStefano Zampini     ierr = ISDestroy(&extrows[i]);CHKERRQ(ierr);
1366a13144ffSStefano Zampini     ierr = ISDestroy(&extcols[i]);CHKERRQ(ierr);
13671e0482f5SStefano Zampini     ierr = ISDestroy(&cornersis);CHKERRQ(ierr);
1368a13144ffSStefano Zampini     ierr = MatDestroy(&Gins);CHKERRQ(ierr);
1369a13144ffSStefano Zampini     ierr = MatDestroy(&GKins);CHKERRQ(ierr);
1370a13144ffSStefano Zampini   }
1371213b8bfaSStefano Zampini   ierr = ISLocalToGlobalMappingDestroy(&el2g);CHKERRQ(ierr);
1372a13144ffSStefano Zampini 
1373a13144ffSStefano Zampini   /* Start assembling */
1374a13144ffSStefano Zampini   ierr = MatAssemblyBegin(T,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
13751e0482f5SStefano Zampini   if (pcbddc->nedcG) {
13761e0482f5SStefano Zampini     ierr = MatAssemblyBegin(pcbddc->nedcG,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
13771e0482f5SStefano Zampini   }
1378a13144ffSStefano Zampini 
1379a13144ffSStefano Zampini   /* Free */
1380c2151214SStefano Zampini   if (fl2g) {
1381c2151214SStefano Zampini     ierr = ISDestroy(&primals);CHKERRQ(ierr);
1382c2151214SStefano Zampini     for (i=0;i<nee;i++) {
1383c2151214SStefano Zampini       ierr = ISDestroy(&eedges[i]);CHKERRQ(ierr);
1384c2151214SStefano Zampini     }
1385c2151214SStefano Zampini     ierr = PetscFree(eedges);CHKERRQ(ierr);
1386c2151214SStefano Zampini   }
1387eee23b56SStefano Zampini 
1388eee23b56SStefano Zampini   /* hack mat_graph with primal dofs on the coarse edges */
1389eee23b56SStefano Zampini   {
1390eee23b56SStefano Zampini     PCBDDCGraph graph   = pcbddc->mat_graph;
1391eee23b56SStefano Zampini     PetscInt    *oqueue = graph->queue;
1392eee23b56SStefano Zampini     PetscInt    *ocptr  = graph->cptr;
1393eee23b56SStefano Zampini     PetscInt    ncc,*idxs;
1394eee23b56SStefano Zampini 
1395eee23b56SStefano Zampini     /* find first primal edge */
1396eee23b56SStefano Zampini     if (pcbddc->nedclocal) {
1397eee23b56SStefano Zampini       ierr = ISGetIndices(pcbddc->nedclocal,(const PetscInt**)&idxs);CHKERRQ(ierr);
1398eee23b56SStefano Zampini     } else {
1399eee23b56SStefano Zampini       if (fl2g) {
1400eee23b56SStefano Zampini         ierr = ISLocalToGlobalMappingApply(fl2g,nee,cedges,cedges);CHKERRQ(ierr);
1401eee23b56SStefano Zampini       }
1402eee23b56SStefano Zampini       idxs = cedges;
1403eee23b56SStefano Zampini     }
1404eee23b56SStefano Zampini     cum = 0;
1405eee23b56SStefano Zampini     while (cum < nee && cedges[cum] < 0) cum++;
1406eee23b56SStefano Zampini 
1407eee23b56SStefano Zampini     /* adapt connected components */
1408eee23b56SStefano Zampini     ierr = PetscMalloc2(graph->nvtxs+1,&graph->cptr,ocptr[graph->ncc],&graph->queue);CHKERRQ(ierr);
1409eee23b56SStefano Zampini     graph->cptr[0] = 0;
1410eee23b56SStefano Zampini     for (i=0,ncc=0;i<graph->ncc;i++) {
1411eee23b56SStefano Zampini       PetscInt lc = ocptr[i+1]-ocptr[i];
1412eee23b56SStefano Zampini       if (cum != nee && oqueue[ocptr[i+1]-1] == cedges[cum]) { /* this cc has a primal dof */
1413eee23b56SStefano Zampini         graph->cptr[ncc+1] = graph->cptr[ncc]+1;
1414eee23b56SStefano Zampini         graph->queue[graph->cptr[ncc]] = cedges[cum];
1415eee23b56SStefano Zampini         ncc++;
1416eee23b56SStefano Zampini         lc--;
1417eee23b56SStefano Zampini         cum++;
1418eee23b56SStefano Zampini         while (cum < nee && cedges[cum] < 0) cum++;
1419eee23b56SStefano Zampini       }
1420eee23b56SStefano Zampini       graph->cptr[ncc+1] = graph->cptr[ncc] + lc;
1421eee23b56SStefano Zampini       for (j=0;j<lc;j++) graph->queue[graph->cptr[ncc]+j] = oqueue[ocptr[i]+j];
1422eee23b56SStefano Zampini       ncc++;
1423eee23b56SStefano Zampini     }
1424eee23b56SStefano Zampini     graph->ncc = ncc;
1425eee23b56SStefano Zampini     if (pcbddc->nedclocal) {
1426eee23b56SStefano Zampini       ierr = ISRestoreIndices(pcbddc->nedclocal,(const PetscInt**)&idxs);CHKERRQ(ierr);
1427eee23b56SStefano Zampini     }
1428eee23b56SStefano Zampini     ierr = PetscFree2(ocptr,oqueue);CHKERRQ(ierr);
1429eee23b56SStefano Zampini   }
1430213b8bfaSStefano Zampini   ierr = ISLocalToGlobalMappingDestroy(&fl2g);CHKERRQ(ierr);
1431c2151214SStefano Zampini   ierr = PCBDDCGraphRestoreCandidatesIS(pcbddc->mat_graph,NULL,NULL,&nee,&alleedges,&allprimals);CHKERRQ(ierr);
1432c2151214SStefano Zampini   ierr = PCBDDCGraphResetCSR(pcbddc->mat_graph);CHKERRQ(ierr);
1433213b8bfaSStefano Zampini   ierr = MatDestroy(&conn);CHKERRQ(ierr);
1434eee23b56SStefano Zampini 
1435c2151214SStefano Zampini   ierr = ISDestroy(&nedfieldlocal);CHKERRQ(ierr);
1436a13144ffSStefano Zampini   ierr = PetscFree(extrow);CHKERRQ(ierr);
1437a13144ffSStefano Zampini   ierr = PetscFree2(work,rwork);CHKERRQ(ierr);
1438b03ebc13SStefano Zampini   ierr = PetscFree(corners);CHKERRQ(ierr);
1439b03ebc13SStefano Zampini   ierr = PetscFree(cedges);CHKERRQ(ierr);
1440a13144ffSStefano Zampini   ierr = PetscFree(extrows);CHKERRQ(ierr);
1441a13144ffSStefano Zampini   ierr = PetscFree(extcols);CHKERRQ(ierr);
1442a13144ffSStefano Zampini   ierr = MatDestroy(&lG);CHKERRQ(ierr);
1443a13144ffSStefano Zampini 
1444a13144ffSStefano Zampini   /* Complete assembling */
1445a13144ffSStefano Zampini   ierr = MatAssemblyEnd(T,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
14461e0482f5SStefano Zampini   if (pcbddc->nedcG) {
14471e0482f5SStefano Zampini     ierr = MatAssemblyEnd(pcbddc->nedcG,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
14481e0482f5SStefano Zampini #if 0
14491e0482f5SStefano Zampini     ierr = PetscObjectSetName((PetscObject)pcbddc->nedcG,"coarse_G");CHKERRQ(ierr);
14501e0482f5SStefano Zampini     ierr = MatView(pcbddc->nedcG,NULL);CHKERRQ(ierr);
14511e0482f5SStefano Zampini #endif
14521e0482f5SStefano Zampini   }
1453a13144ffSStefano Zampini 
1454a13144ffSStefano Zampini   /* set change of basis */
1455213b8bfaSStefano Zampini   ierr = PCBDDCSetChangeOfBasisMat(pc,T,singular);CHKERRQ(ierr);
1456a13144ffSStefano Zampini   ierr = MatDestroy(&T);CHKERRQ(ierr);
1457a13144ffSStefano Zampini 
1458a13144ffSStefano Zampini   PetscFunctionReturn(0);
1459a13144ffSStefano Zampini }
1460a13144ffSStefano Zampini 
1461d8203eabSStefano Zampini /* the near-null space of BDDC carries information on quadrature weights,
1462d8203eabSStefano Zampini    and these can be collinear -> so cheat with MatNullSpaceCreate
1463d8203eabSStefano Zampini    and create a suitable set of basis vectors first */
1464d8203eabSStefano Zampini PetscErrorCode PCBDDCNullSpaceCreate(MPI_Comm comm, PetscBool has_const, PetscInt nvecs, Vec quad_vecs[], MatNullSpace *nnsp)
1465d8203eabSStefano Zampini {
1466d8203eabSStefano Zampini   PetscErrorCode ierr;
1467d8203eabSStefano Zampini   PetscInt       i;
1468d8203eabSStefano Zampini 
1469d8203eabSStefano Zampini   PetscFunctionBegin;
1470d8203eabSStefano Zampini   for (i=0;i<nvecs;i++) {
1471d8203eabSStefano Zampini     PetscInt first,last;
1472d8203eabSStefano Zampini 
1473d8203eabSStefano Zampini     ierr = VecGetOwnershipRange(quad_vecs[i],&first,&last);CHKERRQ(ierr);
147486fa73c5SStefano Zampini     if (last-first < 2*nvecs && has_const) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"Not implemented");
1475d8203eabSStefano Zampini     if (i>=first && i < last) {
1476d8203eabSStefano Zampini       PetscScalar *data;
1477d8203eabSStefano Zampini       ierr = VecGetArray(quad_vecs[i],&data);CHKERRQ(ierr);
1478d8203eabSStefano Zampini       if (!has_const) {
1479d8203eabSStefano Zampini         data[i-first] = 1.;
1480d8203eabSStefano Zampini       } else {
148186fa73c5SStefano Zampini         data[2*i-first] = 1./PetscSqrtReal(2.);
148286fa73c5SStefano Zampini         data[2*i-first+1] = -1./PetscSqrtReal(2.);
1483d8203eabSStefano Zampini       }
1484d8203eabSStefano Zampini       ierr = VecRestoreArray(quad_vecs[i],&data);CHKERRQ(ierr);
1485d8203eabSStefano Zampini     }
1486d8203eabSStefano Zampini     ierr = PetscObjectStateIncrease((PetscObject)quad_vecs[i]);CHKERRQ(ierr);
1487d8203eabSStefano Zampini   }
1488d8203eabSStefano Zampini   ierr = MatNullSpaceCreate(comm,has_const,nvecs,quad_vecs,nnsp);CHKERRQ(ierr);
1489d8203eabSStefano Zampini   for (i=0;i<nvecs;i++) { /* reset vectors */
1490d8203eabSStefano Zampini     PetscInt first,last;
1491ddc40e2cSstefano_zampini     ierr = VecLockPop(quad_vecs[i]);CHKERRQ(ierr);
1492d8203eabSStefano Zampini     ierr = VecGetOwnershipRange(quad_vecs[i],&first,&last);CHKERRQ(ierr);
1493d8203eabSStefano Zampini     if (i>=first && i < last) {
1494d8203eabSStefano Zampini       PetscScalar *data;
1495d8203eabSStefano Zampini       ierr = VecGetArray(quad_vecs[i],&data);CHKERRQ(ierr);
1496d8203eabSStefano Zampini       if (!has_const) {
1497d8203eabSStefano Zampini         data[i-first] = 0.;
1498d8203eabSStefano Zampini       } else {
149986fa73c5SStefano Zampini         data[2*i-first] = 0.;
150086fa73c5SStefano Zampini         data[2*i-first+1] = 0.;
1501d8203eabSStefano Zampini       }
1502d8203eabSStefano Zampini       ierr = VecRestoreArray(quad_vecs[i],&data);CHKERRQ(ierr);
1503d8203eabSStefano Zampini     }
1504d8203eabSStefano Zampini     ierr = PetscObjectStateIncrease((PetscObject)quad_vecs[i]);CHKERRQ(ierr);
1505ddc40e2cSstefano_zampini     ierr = VecLockPush(quad_vecs[i]);CHKERRQ(ierr);
1506d8203eabSStefano Zampini   }
1507d8203eabSStefano Zampini   PetscFunctionReturn(0);
1508d8203eabSStefano Zampini }
1509d8203eabSStefano Zampini 
15108ae0ca82SStefano Zampini PetscErrorCode PCBDDCComputeNoNetFlux(Mat A, Mat divudotp, PetscBool transpose, IS vl2l, PCBDDCGraph graph, MatNullSpace *nnsp)
1511669cc0f4SStefano Zampini {
1512a198735bSStefano Zampini   Mat                    loc_divudotp;
1513fa23a32eSStefano Zampini   Vec                    p,v,vins,quad_vec,*quad_vecs;
15148ae0ca82SStefano Zampini   ISLocalToGlobalMapping map;
1515669cc0f4SStefano Zampini   IS                     *faces,*edges;
1516669cc0f4SStefano Zampini   PetscScalar            *vals;
1517669cc0f4SStefano Zampini   const PetscScalar      *array;
1518669cc0f4SStefano Zampini   PetscInt               i,maxneighs,lmaxneighs,maxsize,nf,ne;
15191ae86dd6SStefano Zampini   PetscMPIInt            rank;
1520a198735bSStefano Zampini   PetscErrorCode         ierr;
1521669cc0f4SStefano Zampini 
1522669cc0f4SStefano Zampini   PetscFunctionBegin;
1523669cc0f4SStefano Zampini   ierr = PCBDDCGraphGetCandidatesIS(graph,&nf,&faces,&ne,&edges,NULL);CHKERRQ(ierr);
1524669cc0f4SStefano Zampini   if (graph->twodim) {
1525669cc0f4SStefano Zampini     lmaxneighs = 2;
1526669cc0f4SStefano Zampini   } else {
1527669cc0f4SStefano Zampini     lmaxneighs = 1;
1528669cc0f4SStefano Zampini     for (i=0;i<ne;i++) {
1529669cc0f4SStefano Zampini       const PetscInt *idxs;
1530669cc0f4SStefano Zampini       ierr = ISGetIndices(edges[i],&idxs);CHKERRQ(ierr);
1531669cc0f4SStefano Zampini       lmaxneighs = PetscMax(lmaxneighs,graph->count[idxs[0]]);
1532669cc0f4SStefano Zampini       ierr = ISRestoreIndices(edges[i],&idxs);CHKERRQ(ierr);
1533669cc0f4SStefano Zampini     }
1534669cc0f4SStefano Zampini     lmaxneighs++; /* graph count does not include self */
1535669cc0f4SStefano Zampini   }
1536669cc0f4SStefano Zampini   ierr = MPIU_Allreduce(&lmaxneighs,&maxneighs,1,MPIU_INT,MPI_MAX,PetscObjectComm((PetscObject)A));CHKERRQ(ierr);
1537669cc0f4SStefano Zampini   maxsize = 0;
1538669cc0f4SStefano Zampini   for (i=0;i<ne;i++) {
1539669cc0f4SStefano Zampini     PetscInt nn;
1540669cc0f4SStefano Zampini     ierr = ISGetLocalSize(edges[i],&nn);CHKERRQ(ierr);
1541669cc0f4SStefano Zampini     maxsize = PetscMax(maxsize,nn);
1542669cc0f4SStefano Zampini   }
1543669cc0f4SStefano Zampini   for (i=0;i<nf;i++) {
1544669cc0f4SStefano Zampini     PetscInt nn;
1545669cc0f4SStefano Zampini     ierr = ISGetLocalSize(faces[i],&nn);CHKERRQ(ierr);
1546669cc0f4SStefano Zampini     maxsize = PetscMax(maxsize,nn);
1547669cc0f4SStefano Zampini   }
1548669cc0f4SStefano Zampini   ierr = PetscMalloc1(maxsize,&vals);CHKERRQ(ierr);
1549669cc0f4SStefano Zampini   /* create vectors to hold quadrature weights */
1550669cc0f4SStefano Zampini   ierr = MatCreateVecs(A,&quad_vec,NULL);CHKERRQ(ierr);
15518ae0ca82SStefano Zampini   if (!transpose) {
15528ae0ca82SStefano Zampini     ierr = MatGetLocalToGlobalMapping(A,&map,NULL);CHKERRQ(ierr);
15538ae0ca82SStefano Zampini   } else {
15548ae0ca82SStefano Zampini     ierr = MatGetLocalToGlobalMapping(A,NULL,&map);CHKERRQ(ierr);
15558ae0ca82SStefano Zampini   }
1556669cc0f4SStefano Zampini   ierr = VecDuplicateVecs(quad_vec,maxneighs,&quad_vecs);CHKERRQ(ierr);
15571ae86dd6SStefano Zampini   ierr = VecDestroy(&quad_vec);CHKERRQ(ierr);
1558d8203eabSStefano Zampini   ierr = PCBDDCNullSpaceCreate(PetscObjectComm((PetscObject)A),PETSC_FALSE,maxneighs,quad_vecs,nnsp);CHKERRQ(ierr);
1559669cc0f4SStefano Zampini   for (i=0;i<maxneighs;i++) {
1560ddc40e2cSstefano_zampini     ierr = VecLockPop(quad_vecs[i]);CHKERRQ(ierr);
15618ae0ca82SStefano Zampini     ierr = VecSetLocalToGlobalMapping(quad_vecs[i],map);CHKERRQ(ierr);
1562669cc0f4SStefano Zampini   }
1563d8203eabSStefano Zampini 
1564669cc0f4SStefano Zampini   /* compute local quad vec */
1565a198735bSStefano Zampini   ierr = MatISGetLocalMat(divudotp,&loc_divudotp);CHKERRQ(ierr);
15668ae0ca82SStefano Zampini   if (!transpose) {
1567a198735bSStefano Zampini     ierr = MatCreateVecs(loc_divudotp,&v,&p);CHKERRQ(ierr);
15688ae0ca82SStefano Zampini   } else {
15698ae0ca82SStefano Zampini     ierr = MatCreateVecs(loc_divudotp,&p,&v);CHKERRQ(ierr);
15708ae0ca82SStefano Zampini   }
1571669cc0f4SStefano Zampini   ierr = VecSet(p,1.);CHKERRQ(ierr);
15728ae0ca82SStefano Zampini   if (!transpose) {
1573a198735bSStefano Zampini     ierr = MatMultTranspose(loc_divudotp,p,v);CHKERRQ(ierr);
15748ae0ca82SStefano Zampini   } else {
15758ae0ca82SStefano Zampini     ierr = MatMult(loc_divudotp,p,v);CHKERRQ(ierr);
15768ae0ca82SStefano Zampini   }
1577fa23a32eSStefano Zampini   if (vl2l) {
1578187c917aSStefano Zampini     Mat        lA;
1579187c917aSStefano Zampini     VecScatter sc;
1580187c917aSStefano Zampini 
1581187c917aSStefano Zampini     ierr = MatISGetLocalMat(A,&lA);CHKERRQ(ierr);
1582187c917aSStefano Zampini     ierr = MatCreateVecs(lA,&vins,NULL);CHKERRQ(ierr);
1583187c917aSStefano Zampini     ierr = VecScatterCreate(v,vl2l,vins,NULL,&sc);CHKERRQ(ierr);
1584187c917aSStefano Zampini     ierr = VecScatterBegin(sc,v,vins,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
1585187c917aSStefano Zampini     ierr = VecScatterEnd(sc,v,vins,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
1586187c917aSStefano Zampini     ierr = VecScatterDestroy(&sc);CHKERRQ(ierr);
1587fa23a32eSStefano Zampini   } else {
1588fa23a32eSStefano Zampini     vins = v;
1589fa23a32eSStefano Zampini   }
1590fa23a32eSStefano Zampini   ierr = VecGetArrayRead(vins,&array);CHKERRQ(ierr);
1591669cc0f4SStefano Zampini   ierr = VecDestroy(&p);CHKERRQ(ierr);
15929a962809SStefano Zampini 
15931ae86dd6SStefano Zampini   /* insert in global quadrature vecs */
15941ae86dd6SStefano Zampini   ierr = MPI_Comm_rank(PetscObjectComm((PetscObject)A),&rank);CHKERRQ(ierr);
1595669cc0f4SStefano Zampini   for (i=0;i<nf;i++) {
1596669cc0f4SStefano Zampini     const PetscInt    *idxs;
1597669cc0f4SStefano Zampini     PetscInt          idx,nn,j;
1598669cc0f4SStefano Zampini 
1599669cc0f4SStefano Zampini     ierr = ISGetIndices(faces[i],&idxs);CHKERRQ(ierr);
1600669cc0f4SStefano Zampini     ierr = ISGetLocalSize(faces[i],&nn);CHKERRQ(ierr);
1601669cc0f4SStefano Zampini     for (j=0;j<nn;j++) vals[j] = array[idxs[j]];
16021ae86dd6SStefano Zampini     ierr = PetscFindInt(rank,graph->count[idxs[0]],graph->neighbours_set[idxs[0]],&idx);CHKERRQ(ierr);
1603669cc0f4SStefano Zampini     idx  = -(idx+1);
1604669cc0f4SStefano Zampini     ierr = VecSetValuesLocal(quad_vecs[idx],nn,idxs,vals,INSERT_VALUES);CHKERRQ(ierr);
1605669cc0f4SStefano Zampini     ierr = ISRestoreIndices(faces[i],&idxs);CHKERRQ(ierr);
1606669cc0f4SStefano Zampini   }
1607669cc0f4SStefano Zampini   for (i=0;i<ne;i++) {
1608669cc0f4SStefano Zampini     const PetscInt    *idxs;
1609669cc0f4SStefano Zampini     PetscInt          idx,nn,j;
1610669cc0f4SStefano Zampini 
1611669cc0f4SStefano Zampini     ierr = ISGetIndices(edges[i],&idxs);CHKERRQ(ierr);
1612669cc0f4SStefano Zampini     ierr = ISGetLocalSize(edges[i],&nn);CHKERRQ(ierr);
1613669cc0f4SStefano Zampini     for (j=0;j<nn;j++) vals[j] = array[idxs[j]];
16141ae86dd6SStefano Zampini     ierr = PetscFindInt(rank,graph->count[idxs[0]],graph->neighbours_set[idxs[0]],&idx);CHKERRQ(ierr);
1615669cc0f4SStefano Zampini     idx  = -(idx+1);
1616669cc0f4SStefano Zampini     ierr = VecSetValuesLocal(quad_vecs[idx],nn,idxs,vals,INSERT_VALUES);CHKERRQ(ierr);
1617669cc0f4SStefano Zampini     ierr = ISRestoreIndices(edges[i],&idxs);CHKERRQ(ierr);
1618669cc0f4SStefano Zampini   }
1619c8272957SStefano Zampini   ierr = PCBDDCGraphRestoreCandidatesIS(graph,&nf,&faces,&ne,&edges,NULL);CHKERRQ(ierr);
1620fa23a32eSStefano Zampini   ierr = VecRestoreArrayRead(vins,&array);CHKERRQ(ierr);
1621fa23a32eSStefano Zampini   if (vl2l) {
1622187c917aSStefano Zampini     ierr = VecDestroy(&vins);CHKERRQ(ierr);
1623fa23a32eSStefano Zampini   }
1624669cc0f4SStefano Zampini   ierr = VecDestroy(&v);CHKERRQ(ierr);
1625669cc0f4SStefano Zampini   ierr = PetscFree(vals);CHKERRQ(ierr);
1626669cc0f4SStefano Zampini 
1627669cc0f4SStefano Zampini   /* assemble near null space */
1628669cc0f4SStefano Zampini   for (i=0;i<maxneighs;i++) {
1629669cc0f4SStefano Zampini     ierr = VecAssemblyBegin(quad_vecs[i]);CHKERRQ(ierr);
1630669cc0f4SStefano Zampini   }
1631669cc0f4SStefano Zampini   for (i=0;i<maxneighs;i++) {
1632669cc0f4SStefano Zampini     ierr = VecAssemblyEnd(quad_vecs[i]);CHKERRQ(ierr);
1633ddc40e2cSstefano_zampini     ierr = VecLockPush(quad_vecs[i]);CHKERRQ(ierr);
1634669cc0f4SStefano Zampini   }
1635669cc0f4SStefano Zampini   ierr = VecDestroyVecs(maxneighs,&quad_vecs);CHKERRQ(ierr);
1636669cc0f4SStefano Zampini   PetscFunctionReturn(0);
1637669cc0f4SStefano Zampini }
1638669cc0f4SStefano Zampini 
1639669cc0f4SStefano Zampini 
16401f4df5f7SStefano Zampini PetscErrorCode PCBDDCComputeLocalTopologyInfo(PC pc)
16411f4df5f7SStefano Zampini {
16421f4df5f7SStefano Zampini   PetscErrorCode ierr;
16431f4df5f7SStefano Zampini   Vec            local,global;
16441f4df5f7SStefano Zampini   PC_BDDC        *pcbddc = (PC_BDDC*)pc->data;
16451f4df5f7SStefano Zampini   Mat_IS         *matis = (Mat_IS*)pc->pmat->data;
16465c5e10d6SStefano Zampini   PetscBool      monolithic = PETSC_FALSE;
16471f4df5f7SStefano Zampini 
16481f4df5f7SStefano Zampini   PetscFunctionBegin;
16495c5e10d6SStefano Zampini   ierr = PetscOptionsBegin(PetscObjectComm((PetscObject)pc),((PetscObject)pc)->prefix,"BDDC topology options","PC");CHKERRQ(ierr);
16505c5e10d6SStefano Zampini   ierr = PetscOptionsBool("-pc_bddc_monolithic","Discard any information on dofs splitting",NULL,monolithic,&monolithic,NULL);CHKERRQ(ierr);
16515c5e10d6SStefano Zampini   ierr = PetscOptionsEnd();CHKERRQ(ierr);
16521f4df5f7SStefano Zampini   /* need to convert from global to local topology information and remove references to information in global ordering */
165321ef3d20SStefano Zampini   ierr = MatCreateVecs(pc->pmat,&global,NULL);CHKERRQ(ierr);
16541f4df5f7SStefano Zampini   ierr = MatCreateVecs(matis->A,&local,NULL);CHKERRQ(ierr);
16555c5e10d6SStefano Zampini   if (monolithic) goto boundary;
16565c5e10d6SStefano Zampini 
16571f4df5f7SStefano Zampini   if (pcbddc->user_provided_isfordofs) {
16581f4df5f7SStefano Zampini     if (pcbddc->n_ISForDofs) {
16591f4df5f7SStefano Zampini       PetscInt i;
16601f4df5f7SStefano Zampini       ierr = PetscMalloc1(pcbddc->n_ISForDofs,&pcbddc->ISForDofsLocal);CHKERRQ(ierr);
16611f4df5f7SStefano Zampini       for (i=0;i<pcbddc->n_ISForDofs;i++) {
16621f4df5f7SStefano Zampini         ierr = PCBDDCGlobalToLocal(matis->rctx,global,local,pcbddc->ISForDofs[i],&pcbddc->ISForDofsLocal[i]);CHKERRQ(ierr);
16631f4df5f7SStefano Zampini         ierr = ISDestroy(&pcbddc->ISForDofs[i]);CHKERRQ(ierr);
16641f4df5f7SStefano Zampini       }
16651f4df5f7SStefano Zampini       pcbddc->n_ISForDofsLocal = pcbddc->n_ISForDofs;
16661f4df5f7SStefano Zampini       pcbddc->n_ISForDofs = 0;
16671f4df5f7SStefano Zampini       ierr = PetscFree(pcbddc->ISForDofs);CHKERRQ(ierr);
16681f4df5f7SStefano Zampini     }
16691f4df5f7SStefano Zampini   } else {
167021ef3d20SStefano Zampini     if (!pcbddc->n_ISForDofsLocal) { /* field split not present */
167121ef3d20SStefano Zampini       DM dm;
167221ef3d20SStefano Zampini 
167321ef3d20SStefano Zampini       ierr = PCGetDM(pc, &dm);CHKERRQ(ierr);
167421ef3d20SStefano Zampini       if (!dm) {
167521ef3d20SStefano Zampini         ierr = MatGetDM(pc->pmat, &dm);CHKERRQ(ierr);
167621ef3d20SStefano Zampini       }
167721ef3d20SStefano Zampini       if (dm) {
167821ef3d20SStefano Zampini         IS      *fields;
167921ef3d20SStefano Zampini         PetscInt nf,i;
168021ef3d20SStefano Zampini         ierr = DMCreateFieldDecomposition(dm,&nf,NULL,&fields,NULL);CHKERRQ(ierr);
168121ef3d20SStefano Zampini         ierr = PetscMalloc1(nf,&pcbddc->ISForDofsLocal);CHKERRQ(ierr);
168221ef3d20SStefano Zampini         for (i=0;i<nf;i++) {
168321ef3d20SStefano Zampini           ierr = PCBDDCGlobalToLocal(matis->rctx,global,local,fields[i],&pcbddc->ISForDofsLocal[i]);CHKERRQ(ierr);
168421ef3d20SStefano Zampini           ierr = ISDestroy(&fields[i]);CHKERRQ(ierr);
168521ef3d20SStefano Zampini         }
168621ef3d20SStefano Zampini         ierr = PetscFree(fields);CHKERRQ(ierr);
168721ef3d20SStefano Zampini         pcbddc->n_ISForDofsLocal = nf;
168821ef3d20SStefano Zampini       } else { /* See if MATIS has fields attached by the conversion from MatNest */
168921ef3d20SStefano Zampini         PetscContainer   c;
169021ef3d20SStefano Zampini 
169121ef3d20SStefano Zampini         ierr = PetscObjectQuery((PetscObject)pc->pmat,"_convert_nest_lfields",(PetscObject*)&c);CHKERRQ(ierr);
169221ef3d20SStefano Zampini         if (c) {
169321ef3d20SStefano Zampini           MatISLocalFields lf;
169421ef3d20SStefano Zampini           ierr = PetscContainerGetPointer(c,(void**)&lf);CHKERRQ(ierr);
169521ef3d20SStefano Zampini           ierr = PCBDDCSetDofsSplittingLocal(pc,lf->nr,lf->rf);CHKERRQ(ierr);
169621ef3d20SStefano Zampini         } else { /* fallback, create the default fields if bs > 1 */
16971f4df5f7SStefano Zampini           PetscInt i, n = matis->A->rmap->n;
1698986cdee1SStefano Zampini           ierr = MatGetBlockSize(pc->pmat,&i);CHKERRQ(ierr);
169921ef3d20SStefano Zampini           if (i > 1) {
1700986cdee1SStefano Zampini             pcbddc->n_ISForDofsLocal = i;
17011f4df5f7SStefano Zampini             ierr = PetscMalloc1(pcbddc->n_ISForDofsLocal,&pcbddc->ISForDofsLocal);CHKERRQ(ierr);
17021f4df5f7SStefano Zampini             for (i=0;i<pcbddc->n_ISForDofsLocal;i++) {
17031f4df5f7SStefano Zampini               ierr = ISCreateStride(PetscObjectComm((PetscObject)pc),n/pcbddc->n_ISForDofsLocal,i,pcbddc->n_ISForDofsLocal,&pcbddc->ISForDofsLocal[i]);CHKERRQ(ierr);
17041f4df5f7SStefano Zampini             }
17051f4df5f7SStefano Zampini           }
170621ef3d20SStefano Zampini         }
170721ef3d20SStefano Zampini       }
17087a0e7b2cSstefano_zampini     } else {
17097a0e7b2cSstefano_zampini       PetscInt i;
17107a0e7b2cSstefano_zampini       for (i=0;i<pcbddc->n_ISForDofsLocal;i++) {
17117a0e7b2cSstefano_zampini         ierr = PCBDDCConsistencyCheckIS(pc,MPI_LAND,&pcbddc->ISForDofsLocal[i]);CHKERRQ(ierr);
17127a0e7b2cSstefano_zampini       }
17131f4df5f7SStefano Zampini     }
1714986cdee1SStefano Zampini   }
17151f4df5f7SStefano Zampini 
17165c5e10d6SStefano Zampini boundary:
17171f4df5f7SStefano Zampini   if (!pcbddc->DirichletBoundariesLocal && pcbddc->DirichletBoundaries) {
17181f4df5f7SStefano Zampini     ierr = PCBDDCGlobalToLocal(matis->rctx,global,local,pcbddc->DirichletBoundaries,&pcbddc->DirichletBoundariesLocal);CHKERRQ(ierr);
17197a0e7b2cSstefano_zampini   } else if (pcbddc->DirichletBoundariesLocal) {
17207a0e7b2cSstefano_zampini     ierr = PCBDDCConsistencyCheckIS(pc,MPI_LAND,&pcbddc->DirichletBoundariesLocal);CHKERRQ(ierr);
17211f4df5f7SStefano Zampini   }
17221f4df5f7SStefano Zampini   if (!pcbddc->NeumannBoundariesLocal && pcbddc->NeumannBoundaries) {
17231f4df5f7SStefano Zampini     ierr = PCBDDCGlobalToLocal(matis->rctx,global,local,pcbddc->NeumannBoundaries,&pcbddc->NeumannBoundariesLocal);CHKERRQ(ierr);
17247a0e7b2cSstefano_zampini   } else if (pcbddc->NeumannBoundariesLocal) {
17257a0e7b2cSstefano_zampini     ierr = PCBDDCConsistencyCheckIS(pc,MPI_LOR,&pcbddc->NeumannBoundariesLocal);CHKERRQ(ierr);
17261f4df5f7SStefano Zampini   }
17271f4df5f7SStefano Zampini   if (!pcbddc->user_primal_vertices_local && pcbddc->user_primal_vertices) {
17281f4df5f7SStefano Zampini     ierr = PCBDDCGlobalToLocal(matis->rctx,global,local,pcbddc->user_primal_vertices,&pcbddc->user_primal_vertices_local);CHKERRQ(ierr);
17291f4df5f7SStefano Zampini   }
17301f4df5f7SStefano Zampini   ierr = VecDestroy(&global);CHKERRQ(ierr);
17311f4df5f7SStefano Zampini   ierr = VecDestroy(&local);CHKERRQ(ierr);
17327a0e7b2cSstefano_zampini 
17337a0e7b2cSstefano_zampini   PetscFunctionReturn(0);
17347a0e7b2cSstefano_zampini }
17357a0e7b2cSstefano_zampini 
17367a0e7b2cSstefano_zampini PetscErrorCode PCBDDCConsistencyCheckIS(PC pc, MPI_Op mop, IS *is)
17377a0e7b2cSstefano_zampini {
17387a0e7b2cSstefano_zampini   Mat_IS          *matis = (Mat_IS*)(pc->pmat->data);
17397a0e7b2cSstefano_zampini   PetscErrorCode  ierr;
17407a0e7b2cSstefano_zampini   IS              nis;
17417a0e7b2cSstefano_zampini   const PetscInt  *idxs;
17427a0e7b2cSstefano_zampini   PetscInt        i,nd,n = matis->A->rmap->n,*nidxs,nnd;
17437a0e7b2cSstefano_zampini   PetscBool       *ld;
17447a0e7b2cSstefano_zampini 
17457a0e7b2cSstefano_zampini   PetscFunctionBegin;
17467a0e7b2cSstefano_zampini   if (mop != MPI_LAND && mop != MPI_LOR) SETERRQ(PetscObjectComm((PetscObject)(pc)),PETSC_ERR_SUP,"Supported are MPI_LAND and MPI_LOR");
17477a0e7b2cSstefano_zampini   ierr = MatISSetUpSF(pc->pmat);CHKERRQ(ierr);
17487a0e7b2cSstefano_zampini   if (mop == MPI_LAND) {
17497a0e7b2cSstefano_zampini     /* init rootdata with true */
17507a0e7b2cSstefano_zampini     ld   = (PetscBool*) matis->sf_rootdata;
17517a0e7b2cSstefano_zampini     for (i=0;i<pc->pmat->rmap->n;i++) ld[i] = PETSC_TRUE;
17527a0e7b2cSstefano_zampini   } else {
17537a0e7b2cSstefano_zampini     ierr = PetscMemzero(matis->sf_rootdata,pc->pmat->rmap->n*sizeof(PetscBool));CHKERRQ(ierr);
17547a0e7b2cSstefano_zampini   }
17557a0e7b2cSstefano_zampini   ierr = PetscMemzero(matis->sf_leafdata,n*sizeof(PetscBool));CHKERRQ(ierr);
17567a0e7b2cSstefano_zampini   ierr = ISGetLocalSize(*is,&nd);CHKERRQ(ierr);
17577a0e7b2cSstefano_zampini   ierr = ISGetIndices(*is,&idxs);CHKERRQ(ierr);
17587a0e7b2cSstefano_zampini   ld   = (PetscBool*) matis->sf_leafdata;
17597a0e7b2cSstefano_zampini   for (i=0;i<nd;i++)
17607a0e7b2cSstefano_zampini     if (-1 < idxs[i] && idxs[i] < n)
17617a0e7b2cSstefano_zampini       ld[idxs[i]] = PETSC_TRUE;
17627a0e7b2cSstefano_zampini   ierr = ISRestoreIndices(*is,&idxs);CHKERRQ(ierr);
17637a0e7b2cSstefano_zampini   ierr = PetscSFReduceBegin(matis->sf,MPIU_BOOL,matis->sf_leafdata,matis->sf_rootdata,mop);CHKERRQ(ierr);
17647a0e7b2cSstefano_zampini   ierr = PetscSFReduceEnd(matis->sf,MPIU_BOOL,matis->sf_leafdata,matis->sf_rootdata,mop);CHKERRQ(ierr);
17657a0e7b2cSstefano_zampini   ierr = PetscSFBcastBegin(matis->sf,MPIU_BOOL,matis->sf_rootdata,matis->sf_leafdata);CHKERRQ(ierr);
17667a0e7b2cSstefano_zampini   ierr = PetscSFBcastEnd(matis->sf,MPIU_BOOL,matis->sf_rootdata,matis->sf_leafdata);CHKERRQ(ierr);
17677a0e7b2cSstefano_zampini   if (mop == MPI_LAND) {
17687a0e7b2cSstefano_zampini     ierr = PetscMalloc1(nd,&nidxs);CHKERRQ(ierr);
17697a0e7b2cSstefano_zampini   } else {
17707a0e7b2cSstefano_zampini     ierr = PetscMalloc1(n,&nidxs);CHKERRQ(ierr);
17717a0e7b2cSstefano_zampini   }
17727a0e7b2cSstefano_zampini   for (i=0,nnd=0;i<n;i++)
17737a0e7b2cSstefano_zampini     if (ld[i])
17747a0e7b2cSstefano_zampini       nidxs[nnd++] = i;
17757a0e7b2cSstefano_zampini   ierr = ISCreateGeneral(PetscObjectComm((PetscObject)(*is)),nnd,nidxs,PETSC_OWN_POINTER,&nis);CHKERRQ(ierr);
17767a0e7b2cSstefano_zampini   ierr = ISDestroy(is);CHKERRQ(ierr);
17777a0e7b2cSstefano_zampini   *is  = nis;
17781f4df5f7SStefano Zampini   PetscFunctionReturn(0);
17791f4df5f7SStefano Zampini }
17801f4df5f7SStefano Zampini 
17813e589ea0SStefano Zampini PetscErrorCode PCBDDCBenignRemoveInterior(PC pc,Vec r,Vec z)
17823e589ea0SStefano Zampini {
17833e589ea0SStefano Zampini   PC_IS             *pcis = (PC_IS*)(pc->data);
17843e589ea0SStefano Zampini   PC_BDDC           *pcbddc = (PC_BDDC*)(pc->data);
17853e589ea0SStefano Zampini   PetscErrorCode    ierr;
17863e589ea0SStefano Zampini 
17873e589ea0SStefano Zampini   PetscFunctionBegin;
17883e589ea0SStefano Zampini   if (!pcbddc->benign_have_null) {
17893e589ea0SStefano Zampini     PetscFunctionReturn(0);
17903e589ea0SStefano Zampini   }
17913e589ea0SStefano Zampini   if (pcbddc->ChangeOfBasisMatrix) {
17923e589ea0SStefano Zampini     Vec swap;
17933e589ea0SStefano Zampini 
17943e589ea0SStefano Zampini     ierr = MatMultTranspose(pcbddc->ChangeOfBasisMatrix,r,pcbddc->work_change);CHKERRQ(ierr);
17953e589ea0SStefano Zampini     swap = pcbddc->work_change;
17963e589ea0SStefano Zampini     pcbddc->work_change = r;
17973e589ea0SStefano Zampini     r = swap;
17983e589ea0SStefano Zampini   }
17993e589ea0SStefano Zampini   ierr = VecScatterBegin(pcis->global_to_D,r,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
18003e589ea0SStefano Zampini   ierr = VecScatterEnd(pcis->global_to_D,r,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
18013e589ea0SStefano Zampini   ierr = KSPSolve(pcbddc->ksp_D,pcis->vec1_D,pcis->vec2_D);CHKERRQ(ierr);
18023e589ea0SStefano Zampini   ierr = VecSet(z,0.);CHKERRQ(ierr);
18033e589ea0SStefano Zampini   ierr = VecScatterBegin(pcis->global_to_D,pcis->vec2_D,z,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
18043e589ea0SStefano Zampini   ierr = VecScatterEnd(pcis->global_to_D,pcis->vec2_D,z,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
18053e589ea0SStefano Zampini   if (pcbddc->ChangeOfBasisMatrix) {
1806f913dca9SStefano Zampini     pcbddc->work_change = r;
18073e589ea0SStefano Zampini     ierr = VecCopy(z,pcbddc->work_change);CHKERRQ(ierr);
18083e589ea0SStefano Zampini     ierr = MatMult(pcbddc->ChangeOfBasisMatrix,pcbddc->work_change,z);CHKERRQ(ierr);
18093e589ea0SStefano Zampini   }
18103e589ea0SStefano Zampini   PetscFunctionReturn(0);
18113e589ea0SStefano Zampini }
18123e589ea0SStefano Zampini 
1813a3df083aSStefano Zampini PetscErrorCode PCBDDCBenignMatMult_Private_Private(Mat A, Vec x, Vec y, PetscBool transpose)
1814a3df083aSStefano Zampini {
1815a3df083aSStefano Zampini   PCBDDCBenignMatMult_ctx ctx;
1816a3df083aSStefano Zampini   PetscErrorCode          ierr;
1817a3df083aSStefano Zampini   PetscBool               apply_right,apply_left,reset_x;
1818a3df083aSStefano Zampini 
1819a3df083aSStefano Zampini   PetscFunctionBegin;
1820a3df083aSStefano Zampini   ierr = MatShellGetContext(A,&ctx);CHKERRQ(ierr);
1821a3df083aSStefano Zampini   if (transpose) {
1822a3df083aSStefano Zampini     apply_right = ctx->apply_left;
1823a3df083aSStefano Zampini     apply_left = ctx->apply_right;
1824a3df083aSStefano Zampini   } else {
1825a3df083aSStefano Zampini     apply_right = ctx->apply_right;
1826a3df083aSStefano Zampini     apply_left = ctx->apply_left;
1827a3df083aSStefano Zampini   }
1828a3df083aSStefano Zampini   reset_x = PETSC_FALSE;
1829a3df083aSStefano Zampini   if (apply_right) {
1830a3df083aSStefano Zampini     const PetscScalar *ax;
1831a3df083aSStefano Zampini     PetscInt          nl,i;
1832a3df083aSStefano Zampini 
1833a3df083aSStefano Zampini     ierr = VecGetLocalSize(x,&nl);CHKERRQ(ierr);
1834a3df083aSStefano Zampini     ierr = VecGetArrayRead(x,&ax);CHKERRQ(ierr);
1835a3df083aSStefano Zampini     ierr = PetscMemcpy(ctx->work,ax,nl*sizeof(PetscScalar));CHKERRQ(ierr);
1836a3df083aSStefano Zampini     ierr = VecRestoreArrayRead(x,&ax);CHKERRQ(ierr);
1837a3df083aSStefano Zampini     for (i=0;i<ctx->benign_n;i++) {
1838a3df083aSStefano Zampini       PetscScalar    sum,val;
1839a3df083aSStefano Zampini       const PetscInt *idxs;
1840a3df083aSStefano Zampini       PetscInt       nz,j;
1841a3df083aSStefano Zampini       ierr = ISGetLocalSize(ctx->benign_zerodiag_subs[i],&nz);CHKERRQ(ierr);
1842a3df083aSStefano Zampini       ierr = ISGetIndices(ctx->benign_zerodiag_subs[i],&idxs);CHKERRQ(ierr);
1843a3df083aSStefano Zampini       sum = 0.;
1844a3df083aSStefano Zampini       if (ctx->apply_p0) {
1845a3df083aSStefano Zampini         val = ctx->work[idxs[nz-1]];
1846a3df083aSStefano Zampini         for (j=0;j<nz-1;j++) {
1847a3df083aSStefano Zampini           sum += ctx->work[idxs[j]];
1848a3df083aSStefano Zampini           ctx->work[idxs[j]] += val;
1849a3df083aSStefano Zampini         }
1850a3df083aSStefano Zampini       } else {
1851a3df083aSStefano Zampini         for (j=0;j<nz-1;j++) {
1852a3df083aSStefano Zampini           sum += ctx->work[idxs[j]];
1853a3df083aSStefano Zampini         }
1854a3df083aSStefano Zampini       }
1855a3df083aSStefano Zampini       ctx->work[idxs[nz-1]] -= sum;
1856a3df083aSStefano Zampini       ierr = ISRestoreIndices(ctx->benign_zerodiag_subs[i],&idxs);CHKERRQ(ierr);
1857a3df083aSStefano Zampini     }
1858a3df083aSStefano Zampini     ierr = VecPlaceArray(x,ctx->work);CHKERRQ(ierr);
1859a3df083aSStefano Zampini     reset_x = PETSC_TRUE;
1860a3df083aSStefano Zampini   }
1861a3df083aSStefano Zampini   if (transpose) {
1862a3df083aSStefano Zampini     ierr = MatMultTranspose(ctx->A,x,y);CHKERRQ(ierr);
1863a3df083aSStefano Zampini   } else {
1864a3df083aSStefano Zampini     ierr = MatMult(ctx->A,x,y);CHKERRQ(ierr);
1865a3df083aSStefano Zampini   }
1866a3df083aSStefano Zampini   if (reset_x) {
1867a3df083aSStefano Zampini     ierr = VecResetArray(x);CHKERRQ(ierr);
1868a3df083aSStefano Zampini   }
1869a3df083aSStefano Zampini   if (apply_left) {
1870a3df083aSStefano Zampini     PetscScalar *ay;
1871a3df083aSStefano Zampini     PetscInt    i;
1872a3df083aSStefano Zampini 
1873a3df083aSStefano Zampini     ierr = VecGetArray(y,&ay);CHKERRQ(ierr);
1874a3df083aSStefano Zampini     for (i=0;i<ctx->benign_n;i++) {
1875a3df083aSStefano Zampini       PetscScalar    sum,val;
1876a3df083aSStefano Zampini       const PetscInt *idxs;
1877a3df083aSStefano Zampini       PetscInt       nz,j;
1878a3df083aSStefano Zampini       ierr = ISGetLocalSize(ctx->benign_zerodiag_subs[i],&nz);CHKERRQ(ierr);
1879a3df083aSStefano Zampini       ierr = ISGetIndices(ctx->benign_zerodiag_subs[i],&idxs);CHKERRQ(ierr);
1880a3df083aSStefano Zampini       val = -ay[idxs[nz-1]];
1881a3df083aSStefano Zampini       if (ctx->apply_p0) {
1882a3df083aSStefano Zampini         sum = 0.;
1883a3df083aSStefano Zampini         for (j=0;j<nz-1;j++) {
1884a3df083aSStefano Zampini           sum += ay[idxs[j]];
1885a3df083aSStefano Zampini           ay[idxs[j]] += val;
1886a3df083aSStefano Zampini         }
1887a3df083aSStefano Zampini         ay[idxs[nz-1]] += sum;
1888a3df083aSStefano Zampini       } else {
1889a3df083aSStefano Zampini         for (j=0;j<nz-1;j++) {
1890a3df083aSStefano Zampini           ay[idxs[j]] += val;
1891a3df083aSStefano Zampini         }
1892a3df083aSStefano Zampini         ay[idxs[nz-1]] = 0.;
1893a3df083aSStefano Zampini       }
1894a3df083aSStefano Zampini       ierr = ISRestoreIndices(ctx->benign_zerodiag_subs[i],&idxs);CHKERRQ(ierr);
1895a3df083aSStefano Zampini     }
1896a3df083aSStefano Zampini     ierr = VecRestoreArray(y,&ay);CHKERRQ(ierr);
1897a3df083aSStefano Zampini   }
1898a3df083aSStefano Zampini   PetscFunctionReturn(0);
1899a3df083aSStefano Zampini }
1900a3df083aSStefano Zampini 
1901a3df083aSStefano Zampini PetscErrorCode PCBDDCBenignMatMultTranspose_Private(Mat A, Vec x, Vec y)
1902a3df083aSStefano Zampini {
1903a3df083aSStefano Zampini   PetscErrorCode ierr;
1904a3df083aSStefano Zampini 
1905a3df083aSStefano Zampini   PetscFunctionBegin;
1906a3df083aSStefano Zampini   ierr = PCBDDCBenignMatMult_Private_Private(A,x,y,PETSC_TRUE);CHKERRQ(ierr);
1907a3df083aSStefano Zampini   PetscFunctionReturn(0);
1908a3df083aSStefano Zampini }
1909a3df083aSStefano Zampini 
1910a3df083aSStefano Zampini PetscErrorCode PCBDDCBenignMatMult_Private(Mat A, Vec x, Vec y)
1911a3df083aSStefano Zampini {
1912a3df083aSStefano Zampini   PetscErrorCode ierr;
1913a3df083aSStefano Zampini 
1914a3df083aSStefano Zampini   PetscFunctionBegin;
1915a3df083aSStefano Zampini   ierr = PCBDDCBenignMatMult_Private_Private(A,x,y,PETSC_FALSE);CHKERRQ(ierr);
1916a3df083aSStefano Zampini   PetscFunctionReturn(0);
1917a3df083aSStefano Zampini }
1918a3df083aSStefano Zampini 
1919a3df083aSStefano Zampini PetscErrorCode PCBDDCBenignShellMat(PC pc, PetscBool restore)
1920a3df083aSStefano Zampini {
1921a3df083aSStefano Zampini   PC_IS                   *pcis = (PC_IS*)pc->data;
1922a3df083aSStefano Zampini   PC_BDDC                 *pcbddc = (PC_BDDC*)pc->data;
1923a3df083aSStefano Zampini   PCBDDCBenignMatMult_ctx ctx;
1924a3df083aSStefano Zampini   PetscErrorCode          ierr;
1925a3df083aSStefano Zampini 
1926a3df083aSStefano Zampini   PetscFunctionBegin;
1927a3df083aSStefano Zampini   if (!restore) {
19281dd7afcfSStefano Zampini     Mat                A_IB,A_BI;
1929a3df083aSStefano Zampini     PetscScalar        *work;
1930b334f244SStefano Zampini     PCBDDCReuseSolvers reuse = pcbddc->sub_schurs ? pcbddc->sub_schurs->reuse_solver : NULL;
1931a3df083aSStefano Zampini 
19329a962809SStefano Zampini     if (pcbddc->benign_original_mat) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Benign original mat has not been restored");
19339a962809SStefano Zampini     if (!pcbddc->benign_change || !pcbddc->benign_n || pcbddc->benign_change_explicit) PetscFunctionReturn(0);
1934a3df083aSStefano Zampini     ierr = PetscMalloc1(pcis->n,&work);CHKERRQ(ierr);
1935a3df083aSStefano Zampini     ierr = MatCreate(PETSC_COMM_SELF,&A_IB);CHKERRQ(ierr);
1936a3df083aSStefano Zampini     ierr = MatSetSizes(A_IB,pcis->n-pcis->n_B,pcis->n_B,PETSC_DECIDE,PETSC_DECIDE);CHKERRQ(ierr);
1937a3df083aSStefano Zampini     ierr = MatSetType(A_IB,MATSHELL);CHKERRQ(ierr);
1938a3df083aSStefano Zampini     ierr = MatShellSetOperation(A_IB,MATOP_MULT,(void (*)(void))PCBDDCBenignMatMult_Private);CHKERRQ(ierr);
1939a3df083aSStefano Zampini     ierr = MatShellSetOperation(A_IB,MATOP_MULT_TRANSPOSE,(void (*)(void))PCBDDCBenignMatMultTranspose_Private);CHKERRQ(ierr);
1940a3df083aSStefano Zampini     ierr = PetscNew(&ctx);CHKERRQ(ierr);
1941a3df083aSStefano Zampini     ierr = MatShellSetContext(A_IB,ctx);CHKERRQ(ierr);
1942a3df083aSStefano Zampini     ctx->apply_left = PETSC_TRUE;
1943a3df083aSStefano Zampini     ctx->apply_right = PETSC_FALSE;
1944a3df083aSStefano Zampini     ctx->apply_p0 = PETSC_FALSE;
1945a3df083aSStefano Zampini     ctx->benign_n = pcbddc->benign_n;
1946059032f7SStefano Zampini     if (reuse) {
1947a3df083aSStefano Zampini       ctx->benign_zerodiag_subs = reuse->benign_zerodiag_subs;
19481dd7afcfSStefano Zampini       ctx->free = PETSC_FALSE;
1949059032f7SStefano Zampini     } else { /* TODO: could be optimized for successive solves */
1950059032f7SStefano Zampini       ISLocalToGlobalMapping N_to_D;
1951059032f7SStefano Zampini       PetscInt               i;
1952059032f7SStefano Zampini 
1953059032f7SStefano Zampini       ierr = ISLocalToGlobalMappingCreateIS(pcis->is_I_local,&N_to_D);CHKERRQ(ierr);
1954059032f7SStefano Zampini       ierr = PetscMalloc1(pcbddc->benign_n,&ctx->benign_zerodiag_subs);CHKERRQ(ierr);
1955059032f7SStefano Zampini       for (i=0;i<pcbddc->benign_n;i++) {
1956059032f7SStefano Zampini         ierr = ISGlobalToLocalMappingApplyIS(N_to_D,IS_GTOLM_DROP,pcbddc->benign_zerodiag_subs[i],&ctx->benign_zerodiag_subs[i]);CHKERRQ(ierr);
1957059032f7SStefano Zampini       }
1958059032f7SStefano Zampini       ierr = ISLocalToGlobalMappingDestroy(&N_to_D);CHKERRQ(ierr);
19591dd7afcfSStefano Zampini       ctx->free = PETSC_TRUE;
1960059032f7SStefano Zampini     }
1961a3df083aSStefano Zampini     ctx->A = pcis->A_IB;
1962a3df083aSStefano Zampini     ctx->work = work;
1963a3df083aSStefano Zampini     ierr = MatSetUp(A_IB);CHKERRQ(ierr);
1964a3df083aSStefano Zampini     ierr = MatAssemblyBegin(A_IB,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1965a3df083aSStefano Zampini     ierr = MatAssemblyEnd(A_IB,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1966a3df083aSStefano Zampini     pcis->A_IB = A_IB;
1967a3df083aSStefano Zampini 
1968a3df083aSStefano Zampini     /* A_BI as A_IB^T */
1969a3df083aSStefano Zampini     ierr = MatCreateTranspose(A_IB,&A_BI);CHKERRQ(ierr);
1970a3df083aSStefano Zampini     pcbddc->benign_original_mat = pcis->A_BI;
1971a3df083aSStefano Zampini     pcis->A_BI = A_BI;
1972a3df083aSStefano Zampini   } else {
19731dd7afcfSStefano Zampini     if (!pcbddc->benign_original_mat) {
19741dd7afcfSStefano Zampini       PetscFunctionReturn(0);
19751dd7afcfSStefano Zampini     }
1976a3df083aSStefano Zampini     ierr = MatShellGetContext(pcis->A_IB,&ctx);CHKERRQ(ierr);
1977a3df083aSStefano Zampini     ierr = MatDestroy(&pcis->A_IB);CHKERRQ(ierr);
1978a3df083aSStefano Zampini     pcis->A_IB = ctx->A;
19791dd7afcfSStefano Zampini     ctx->A = NULL;
19801dd7afcfSStefano Zampini     ierr = MatDestroy(&pcis->A_BI);CHKERRQ(ierr);
19811dd7afcfSStefano Zampini     pcis->A_BI = pcbddc->benign_original_mat;
19821dd7afcfSStefano Zampini     pcbddc->benign_original_mat = NULL;
19831dd7afcfSStefano Zampini     if (ctx->free) {
1984059032f7SStefano Zampini       PetscInt i;
19851dd7afcfSStefano Zampini       for (i=0;i<ctx->benign_n;i++) {
1986059032f7SStefano Zampini         ierr = ISDestroy(&ctx->benign_zerodiag_subs[i]);CHKERRQ(ierr);
1987059032f7SStefano Zampini       }
1988059032f7SStefano Zampini       ierr = PetscFree(ctx->benign_zerodiag_subs);CHKERRQ(ierr);
1989059032f7SStefano Zampini     }
1990a3df083aSStefano Zampini     ierr = PetscFree(ctx->work);CHKERRQ(ierr);
1991a3df083aSStefano Zampini     ierr = PetscFree(ctx);CHKERRQ(ierr);
1992a3df083aSStefano Zampini   }
1993a3df083aSStefano Zampini   PetscFunctionReturn(0);
1994a3df083aSStefano Zampini }
1995a3df083aSStefano Zampini 
1996a3df083aSStefano Zampini /* used just in bddc debug mode */
1997a3df083aSStefano Zampini PetscErrorCode PCBDDCBenignProject(PC pc, IS is1, IS is2, Mat *B)
1998a3df083aSStefano Zampini {
1999a3df083aSStefano Zampini   PC_BDDC        *pcbddc = (PC_BDDC*)pc->data;
2000a3df083aSStefano Zampini   Mat_IS         *matis = (Mat_IS*)pc->pmat->data;
2001a3df083aSStefano Zampini   Mat            An;
2002a3df083aSStefano Zampini   PetscErrorCode ierr;
2003a3df083aSStefano Zampini 
2004a3df083aSStefano Zampini   PetscFunctionBegin;
2005a3df083aSStefano Zampini   ierr = MatPtAP(matis->A,pcbddc->benign_change,MAT_INITIAL_MATRIX,2.0,&An);CHKERRQ(ierr);
2006a3df083aSStefano Zampini   ierr = MatZeroRowsColumns(An,pcbddc->benign_n,pcbddc->benign_p0_lidx,1.0,NULL,NULL);CHKERRQ(ierr);
2007a3df083aSStefano Zampini   if (is1) {
20087dae84e0SHong Zhang     ierr = MatCreateSubMatrix(An,is1,is2,MAT_INITIAL_MATRIX,B);CHKERRQ(ierr);
2009a3df083aSStefano Zampini     ierr = MatDestroy(&An);CHKERRQ(ierr);
2010a3df083aSStefano Zampini   } else {
2011a3df083aSStefano Zampini     *B = An;
2012a3df083aSStefano Zampini   }
2013a3df083aSStefano Zampini   PetscFunctionReturn(0);
2014a3df083aSStefano Zampini }
2015a3df083aSStefano Zampini 
20161cf9b237SStefano Zampini /* TODO: add reuse flag */
20171cf9b237SStefano Zampini PetscErrorCode MatSeqAIJCompress(Mat A, Mat *B)
20181cf9b237SStefano Zampini {
20191cf9b237SStefano Zampini   Mat            Bt;
20201cf9b237SStefano Zampini   PetscScalar    *a,*bdata;
20211cf9b237SStefano Zampini   const PetscInt *ii,*ij;
20221cf9b237SStefano Zampini   PetscInt       m,n,i,nnz,*bii,*bij;
20231cf9b237SStefano Zampini   PetscBool      flg_row;
20241cf9b237SStefano Zampini   PetscErrorCode ierr;
20251cf9b237SStefano Zampini 
20261cf9b237SStefano Zampini   PetscFunctionBegin;
20271cf9b237SStefano Zampini   ierr = MatGetSize(A,&n,&m);CHKERRQ(ierr);
20281cf9b237SStefano Zampini   ierr = MatGetRowIJ(A,0,PETSC_FALSE,PETSC_FALSE,&n,&ii,&ij,&flg_row);CHKERRQ(ierr);
20291cf9b237SStefano Zampini   ierr = MatSeqAIJGetArray(A,&a);CHKERRQ(ierr);
20301cf9b237SStefano Zampini   nnz = n;
20311cf9b237SStefano Zampini   for (i=0;i<ii[n];i++) {
20321cf9b237SStefano Zampini     if (PetscLikely(PetscAbsScalar(a[i]) > PETSC_SMALL)) nnz++;
20331cf9b237SStefano Zampini   }
20341cf9b237SStefano Zampini   ierr = PetscMalloc1(n+1,&bii);CHKERRQ(ierr);
20351cf9b237SStefano Zampini   ierr = PetscMalloc1(nnz,&bij);CHKERRQ(ierr);
20361cf9b237SStefano Zampini   ierr = PetscMalloc1(nnz,&bdata);CHKERRQ(ierr);
20371cf9b237SStefano Zampini   nnz = 0;
20381cf9b237SStefano Zampini   bii[0] = 0;
20391cf9b237SStefano Zampini   for (i=0;i<n;i++) {
20401cf9b237SStefano Zampini     PetscInt j;
20411cf9b237SStefano Zampini     for (j=ii[i];j<ii[i+1];j++) {
20421cf9b237SStefano Zampini       PetscScalar entry = a[j];
20431cf9b237SStefano Zampini       if (PetscLikely(PetscAbsScalar(entry) > PETSC_SMALL) || ij[j] == i) {
20441cf9b237SStefano Zampini         bij[nnz] = ij[j];
20451cf9b237SStefano Zampini         bdata[nnz] = entry;
20461cf9b237SStefano Zampini         nnz++;
20471cf9b237SStefano Zampini       }
20481cf9b237SStefano Zampini     }
20491cf9b237SStefano Zampini     bii[i+1] = nnz;
20501cf9b237SStefano Zampini   }
20511cf9b237SStefano Zampini   ierr = MatSeqAIJRestoreArray(A,&a);CHKERRQ(ierr);
20521cf9b237SStefano Zampini   ierr = MatCreateSeqAIJWithArrays(PetscObjectComm((PetscObject)A),n,m,bii,bij,bdata,&Bt);CHKERRQ(ierr);
20531cf9b237SStefano Zampini   ierr = MatRestoreRowIJ(A,0,PETSC_FALSE,PETSC_FALSE,&n,&ii,&ij,&flg_row);CHKERRQ(ierr);
20541cf9b237SStefano Zampini   {
20551cf9b237SStefano Zampini     Mat_SeqAIJ *b = (Mat_SeqAIJ*)(Bt->data);
20561cf9b237SStefano Zampini     b->free_a = PETSC_TRUE;
20571cf9b237SStefano Zampini     b->free_ij = PETSC_TRUE;
20581cf9b237SStefano Zampini   }
20591cf9b237SStefano Zampini   *B = Bt;
20601cf9b237SStefano Zampini   PetscFunctionReturn(0);
20611cf9b237SStefano Zampini }
20621cf9b237SStefano Zampini 
2063c80a6c00SStefano Zampini PetscErrorCode PCBDDCDetectDisconnectedComponents(PC pc, PetscInt *ncc, IS* cc[], IS* primalv)
20644f1b2e48SStefano Zampini {
2065c80a6c00SStefano Zampini   Mat                    B = NULL;
2066c80a6c00SStefano Zampini   DM                     dm;
20674f1b2e48SStefano Zampini   IS                     is_dummy,*cc_n;
20684f1b2e48SStefano Zampini   ISLocalToGlobalMapping l2gmap_dummy;
20694f1b2e48SStefano Zampini   PCBDDCGraph            graph;
2070c80a6c00SStefano Zampini   PetscInt               *xadj_filtered = NULL,*adjncy_filtered = NULL;
20714f1b2e48SStefano Zampini   PetscInt               i,n;
20724f1b2e48SStefano Zampini   PetscInt               *xadj,*adjncy;
2073c80a6c00SStefano Zampini   PetscBool              isplex = PETSC_FALSE;
20744f1b2e48SStefano Zampini   PetscErrorCode         ierr;
20754f1b2e48SStefano Zampini 
20764f1b2e48SStefano Zampini   PetscFunctionBegin;
2077a2eca866SStefano Zampini   if (ncc) *ncc = 0;
2078a2eca866SStefano Zampini   if (cc) *cc = NULL;
2079a2eca866SStefano Zampini   if (primalv) *primalv = NULL;
2080c80a6c00SStefano Zampini   ierr = PCBDDCGraphCreate(&graph);CHKERRQ(ierr);
2081c80a6c00SStefano Zampini   ierr = PCGetDM(pc,&dm);CHKERRQ(ierr);
2082c80a6c00SStefano Zampini   if (!dm) {
2083c80a6c00SStefano Zampini     ierr = MatGetDM(pc->pmat,&dm);CHKERRQ(ierr);
2084c80a6c00SStefano Zampini   }
2085c80a6c00SStefano Zampini   if (dm) {
2086c80a6c00SStefano Zampini     ierr = PetscObjectTypeCompare((PetscObject)dm,DMPLEX,&isplex);CHKERRQ(ierr);
2087c80a6c00SStefano Zampini   }
2088c80a6c00SStefano Zampini   if (isplex) { /* this code has been modified from plexpartition.c */
2089c80a6c00SStefano Zampini     PetscInt       p, pStart, pEnd, a, adjSize, idx, size, nroots;
2090c80a6c00SStefano Zampini     PetscInt      *adj = NULL;
2091c80a6c00SStefano Zampini     IS             cellNumbering;
2092c80a6c00SStefano Zampini     const PetscInt *cellNum;
2093c80a6c00SStefano Zampini     PetscBool      useCone, useClosure;
2094c80a6c00SStefano Zampini     PetscSection   section;
2095c80a6c00SStefano Zampini     PetscSegBuffer adjBuffer;
2096c80a6c00SStefano Zampini     PetscSF        sfPoint;
2097c80a6c00SStefano Zampini     PetscErrorCode ierr;
2098c80a6c00SStefano Zampini 
2099c80a6c00SStefano Zampini     PetscFunctionBegin;
2100c80a6c00SStefano Zampini     ierr = DMPlexGetHeightStratum(dm, 0, &pStart, &pEnd);CHKERRQ(ierr);
2101c80a6c00SStefano Zampini     ierr = DMGetPointSF(dm, &sfPoint);CHKERRQ(ierr);
2102c80a6c00SStefano Zampini     ierr = PetscSFGetGraph(sfPoint, &nroots, NULL, NULL, NULL);CHKERRQ(ierr);
2103c80a6c00SStefano Zampini     /* Build adjacency graph via a section/segbuffer */
2104c80a6c00SStefano Zampini     ierr = PetscSectionCreate(PetscObjectComm((PetscObject) dm), &section);CHKERRQ(ierr);
2105c80a6c00SStefano Zampini     ierr = PetscSectionSetChart(section, pStart, pEnd);CHKERRQ(ierr);
2106c80a6c00SStefano Zampini     ierr = PetscSegBufferCreate(sizeof(PetscInt),1000,&adjBuffer);CHKERRQ(ierr);
2107c80a6c00SStefano Zampini     /* Always use FVM adjacency to create partitioner graph */
2108c80a6c00SStefano Zampini     ierr = DMPlexGetAdjacencyUseCone(dm, &useCone);CHKERRQ(ierr);
2109c80a6c00SStefano Zampini     ierr = DMPlexGetAdjacencyUseClosure(dm, &useClosure);CHKERRQ(ierr);
2110c80a6c00SStefano Zampini     ierr = DMPlexSetAdjacencyUseCone(dm, PETSC_TRUE);CHKERRQ(ierr);
2111c80a6c00SStefano Zampini     ierr = DMPlexSetAdjacencyUseClosure(dm, PETSC_FALSE);CHKERRQ(ierr);
2112956e2312SStefano Zampini     ierr = DMPlexGetCellNumbering(dm, &cellNumbering);CHKERRQ(ierr);
2113c80a6c00SStefano Zampini     ierr = ISGetIndices(cellNumbering, &cellNum);CHKERRQ(ierr);
2114c80a6c00SStefano Zampini     for (n = 0, p = pStart; p < pEnd; p++) {
2115c80a6c00SStefano Zampini       /* Skip non-owned cells in parallel (ParMetis expects no overlap) */
2116c80a6c00SStefano Zampini       if (nroots > 0) {if (cellNum[p] < 0) continue;}
2117c80a6c00SStefano Zampini       adjSize = PETSC_DETERMINE;
2118c80a6c00SStefano Zampini       ierr = DMPlexGetAdjacency(dm, p, &adjSize, &adj);CHKERRQ(ierr);
2119c80a6c00SStefano Zampini       for (a = 0; a < adjSize; ++a) {
2120c80a6c00SStefano Zampini         const PetscInt point = adj[a];
21215cef3d0dSStefano Zampini         if (pStart <= point && point < pEnd) {
2122c80a6c00SStefano Zampini           PetscInt *PETSC_RESTRICT pBuf;
2123c80a6c00SStefano Zampini           ierr = PetscSectionAddDof(section, p, 1);CHKERRQ(ierr);
2124c80a6c00SStefano Zampini           ierr = PetscSegBufferGetInts(adjBuffer, 1, &pBuf);CHKERRQ(ierr);
2125c80a6c00SStefano Zampini           *pBuf = point;
2126c80a6c00SStefano Zampini         }
2127c80a6c00SStefano Zampini       }
2128c80a6c00SStefano Zampini       n++;
2129c80a6c00SStefano Zampini     }
2130c80a6c00SStefano Zampini     ierr = DMPlexSetAdjacencyUseCone(dm, useCone);CHKERRQ(ierr);
2131c80a6c00SStefano Zampini     ierr = DMPlexSetAdjacencyUseClosure(dm, useClosure);CHKERRQ(ierr);
2132c80a6c00SStefano Zampini     /* Derive CSR graph from section/segbuffer */
2133c80a6c00SStefano Zampini     ierr = PetscSectionSetUp(section);CHKERRQ(ierr);
2134c80a6c00SStefano Zampini     ierr = PetscSectionGetStorageSize(section, &size);CHKERRQ(ierr);
2135c80a6c00SStefano Zampini     ierr = PetscMalloc1(n+1, &xadj);CHKERRQ(ierr);
2136c80a6c00SStefano Zampini     for (idx = 0, p = pStart; p < pEnd; p++) {
2137c80a6c00SStefano Zampini       if (nroots > 0) {if (cellNum[p] < 0) continue;}
2138c80a6c00SStefano Zampini       ierr = PetscSectionGetOffset(section, p, &(xadj[idx++]));CHKERRQ(ierr);
2139c80a6c00SStefano Zampini     }
2140c80a6c00SStefano Zampini     xadj[n] = size;
2141c80a6c00SStefano Zampini     ierr = PetscSegBufferExtractAlloc(adjBuffer, &adjncy);CHKERRQ(ierr);
2142c80a6c00SStefano Zampini     /* Clean up */
2143c80a6c00SStefano Zampini     ierr = PetscSegBufferDestroy(&adjBuffer);CHKERRQ(ierr);
2144c80a6c00SStefano Zampini     ierr = PetscSectionDestroy(&section);CHKERRQ(ierr);
2145c80a6c00SStefano Zampini     ierr = PetscFree(adj);CHKERRQ(ierr);
2146c80a6c00SStefano Zampini     graph->xadj = xadj;
2147c80a6c00SStefano Zampini     graph->adjncy = adjncy;
2148c80a6c00SStefano Zampini   } else {
2149c80a6c00SStefano Zampini     Mat       A;
2150c80a6c00SStefano Zampini     PetscBool filter = PETSC_FALSE, isseqaij, flg_row;
2151c80a6c00SStefano Zampini 
2152c80a6c00SStefano Zampini     ierr = MatISGetLocalMat(pc->pmat,&A);CHKERRQ(ierr);
215363c961adSStefano Zampini     if (!A->rmap->N || !A->cmap->N) {
2154a2eca866SStefano Zampini       ierr = PCBDDCGraphDestroy(&graph);CHKERRQ(ierr);
215563c961adSStefano Zampini       PetscFunctionReturn(0);
215663c961adSStefano Zampini     }
21574f1b2e48SStefano Zampini     ierr = PetscObjectTypeCompare((PetscObject)A,MATSEQAIJ,&isseqaij);CHKERRQ(ierr);
21584f1b2e48SStefano Zampini     if (!isseqaij && filter) {
21591cf9b237SStefano Zampini       PetscBool isseqdense;
21601cf9b237SStefano Zampini 
21611cf9b237SStefano Zampini       ierr = PetscObjectTypeCompare((PetscObject)A,MATSEQDENSE,&isseqdense);CHKERRQ(ierr);
21621cf9b237SStefano Zampini       if (!isseqdense) {
21634f1b2e48SStefano Zampini         ierr = MatConvert(A,MATSEQAIJ,MAT_INITIAL_MATRIX,&B);CHKERRQ(ierr);
21641cf9b237SStefano Zampini       } else { /* TODO: rectangular case and LDA */
21651cf9b237SStefano Zampini         PetscScalar *array;
21661cf9b237SStefano Zampini         PetscReal   chop=1.e-6;
21671cf9b237SStefano Zampini 
21681cf9b237SStefano Zampini         ierr = MatDuplicate(A,MAT_COPY_VALUES,&B);CHKERRQ(ierr);
21691cf9b237SStefano Zampini         ierr = MatDenseGetArray(B,&array);CHKERRQ(ierr);
21701cf9b237SStefano Zampini         ierr = MatGetSize(B,&n,NULL);CHKERRQ(ierr);
21711cf9b237SStefano Zampini         for (i=0;i<n;i++) {
21721cf9b237SStefano Zampini           PetscInt j;
21731cf9b237SStefano Zampini           for (j=i+1;j<n;j++) {
21741cf9b237SStefano Zampini             PetscReal thresh = chop*(PetscAbsScalar(array[i*(n+1)])+PetscAbsScalar(array[j*(n+1)]));
21751cf9b237SStefano Zampini             if (PetscAbsScalar(array[i*n+j]) < thresh) array[i*n+j] = 0.;
21761cf9b237SStefano Zampini             if (PetscAbsScalar(array[j*n+i]) < thresh) array[j*n+i] = 0.;
21771cf9b237SStefano Zampini           }
21781cf9b237SStefano Zampini         }
21791cf9b237SStefano Zampini         ierr = MatDenseRestoreArray(B,&array);CHKERRQ(ierr);
21809d54b7f4SStefano Zampini         ierr = MatConvert(B,MATSEQAIJ,MAT_INPLACE_MATRIX,&B);CHKERRQ(ierr);
21811cf9b237SStefano Zampini       }
21824f1b2e48SStefano Zampini     } else {
2183c80a6c00SStefano Zampini       ierr = PetscObjectReference((PetscObject)A);CHKERRQ(ierr);
21844f1b2e48SStefano Zampini       B = A;
21854f1b2e48SStefano Zampini     }
21864f1b2e48SStefano Zampini     ierr = MatGetRowIJ(B,0,PETSC_TRUE,PETSC_FALSE,&n,(const PetscInt**)&xadj,(const PetscInt**)&adjncy,&flg_row);CHKERRQ(ierr);
21874f1b2e48SStefano Zampini 
21884f1b2e48SStefano Zampini     /* if filter is true, then removes entries lower than PETSC_SMALL in magnitude */
21894f1b2e48SStefano Zampini     if (filter) {
21904f1b2e48SStefano Zampini       PetscScalar *data;
21914f1b2e48SStefano Zampini       PetscInt    j,cum;
21924f1b2e48SStefano Zampini 
21934f1b2e48SStefano Zampini       ierr = PetscCalloc2(n+1,&xadj_filtered,xadj[n],&adjncy_filtered);CHKERRQ(ierr);
21944f1b2e48SStefano Zampini       ierr = MatSeqAIJGetArray(B,&data);CHKERRQ(ierr);
21954f1b2e48SStefano Zampini       cum = 0;
21964f1b2e48SStefano Zampini       for (i=0;i<n;i++) {
21974f1b2e48SStefano Zampini         PetscInt t;
21984f1b2e48SStefano Zampini 
21994f1b2e48SStefano Zampini         for (j=xadj[i];j<xadj[i+1];j++) {
22004f1b2e48SStefano Zampini           if (PetscUnlikely(PetscAbsScalar(data[j]) < PETSC_SMALL)) {
22014f1b2e48SStefano Zampini             continue;
22024f1b2e48SStefano Zampini           }
22034f1b2e48SStefano Zampini           adjncy_filtered[cum+xadj_filtered[i]++] = adjncy[j];
22044f1b2e48SStefano Zampini         }
22054f1b2e48SStefano Zampini         t = xadj_filtered[i];
22064f1b2e48SStefano Zampini         xadj_filtered[i] = cum;
22074f1b2e48SStefano Zampini         cum += t;
22084f1b2e48SStefano Zampini       }
22094f1b2e48SStefano Zampini       ierr = MatSeqAIJRestoreArray(B,&data);CHKERRQ(ierr);
22104f1b2e48SStefano Zampini       graph->xadj = xadj_filtered;
22114f1b2e48SStefano Zampini       graph->adjncy = adjncy_filtered;
22124f1b2e48SStefano Zampini     } else {
22134f1b2e48SStefano Zampini       graph->xadj = xadj;
22144f1b2e48SStefano Zampini       graph->adjncy = adjncy;
22154f1b2e48SStefano Zampini     }
2216c80a6c00SStefano Zampini   }
2217c80a6c00SStefano Zampini   /* compute local connected components using PCBDDCGraph */
2218c80a6c00SStefano Zampini   ierr = ISCreateStride(PETSC_COMM_SELF,n,0,1,&is_dummy);CHKERRQ(ierr);
2219c80a6c00SStefano Zampini   ierr = ISLocalToGlobalMappingCreateIS(is_dummy,&l2gmap_dummy);CHKERRQ(ierr);
2220c80a6c00SStefano Zampini   ierr = ISDestroy(&is_dummy);CHKERRQ(ierr);
2221c80a6c00SStefano Zampini   ierr = PCBDDCGraphInit(graph,l2gmap_dummy,n,PETSC_MAX_INT);CHKERRQ(ierr);
2222c80a6c00SStefano Zampini   ierr = ISLocalToGlobalMappingDestroy(&l2gmap_dummy);CHKERRQ(ierr);
22234f1b2e48SStefano Zampini   ierr = PCBDDCGraphSetUp(graph,1,NULL,NULL,0,NULL,NULL);CHKERRQ(ierr);
22244f1b2e48SStefano Zampini   ierr = PCBDDCGraphComputeConnectedComponents(graph);CHKERRQ(ierr);
2225c80a6c00SStefano Zampini 
22264f1b2e48SStefano Zampini   /* partial clean up */
22274f1b2e48SStefano Zampini   ierr = PetscFree2(xadj_filtered,adjncy_filtered);CHKERRQ(ierr);
2228c80a6c00SStefano Zampini   if (B) {
2229c80a6c00SStefano Zampini     PetscBool flg_row;
22304f1b2e48SStefano Zampini     ierr = MatRestoreRowIJ(B,0,PETSC_TRUE,PETSC_FALSE,&n,(const PetscInt**)&xadj,(const PetscInt**)&adjncy,&flg_row);CHKERRQ(ierr);
22314f1b2e48SStefano Zampini     ierr = MatDestroy(&B);CHKERRQ(ierr);
22324f1b2e48SStefano Zampini   }
2233c80a6c00SStefano Zampini   if (isplex) {
2234c80a6c00SStefano Zampini     ierr = PetscFree(xadj);CHKERRQ(ierr);
2235c80a6c00SStefano Zampini     ierr = PetscFree(adjncy);CHKERRQ(ierr);
2236c80a6c00SStefano Zampini   }
22374f1b2e48SStefano Zampini 
22384f1b2e48SStefano Zampini   /* get back data */
2239c80a6c00SStefano Zampini   if (isplex) {
2240c80a6c00SStefano Zampini     if (ncc) *ncc = graph->ncc;
2241c80a6c00SStefano Zampini     if (cc || primalv) {
2242c80a6c00SStefano Zampini       Mat          A;
2243c80a6c00SStefano Zampini       PetscBT      btv,btvt;
2244c80a6c00SStefano Zampini       PetscSection subSection;
2245c80a6c00SStefano Zampini       PetscInt     *ids,cum,cump,*cids,*pids;
2246c80a6c00SStefano Zampini 
2247c80a6c00SStefano Zampini       ierr = DMPlexGetSubdomainSection(dm,&subSection);CHKERRQ(ierr);
2248c80a6c00SStefano Zampini       ierr = MatISGetLocalMat(pc->pmat,&A);CHKERRQ(ierr);
2249c80a6c00SStefano Zampini       ierr = PetscMalloc3(A->rmap->n,&ids,graph->ncc+1,&cids,A->rmap->n,&pids);CHKERRQ(ierr);
2250c80a6c00SStefano Zampini       ierr = PetscBTCreate(A->rmap->n,&btv);CHKERRQ(ierr);
2251c80a6c00SStefano Zampini       ierr = PetscBTCreate(A->rmap->n,&btvt);CHKERRQ(ierr);
2252c80a6c00SStefano Zampini 
2253c80a6c00SStefano Zampini       cids[0] = 0;
2254c80a6c00SStefano Zampini       for (i = 0, cump = 0, cum = 0; i < graph->ncc; i++) {
2255c80a6c00SStefano Zampini         PetscInt j;
2256c80a6c00SStefano Zampini 
2257c80a6c00SStefano Zampini         ierr = PetscBTMemzero(A->rmap->n,btvt);CHKERRQ(ierr);
2258c80a6c00SStefano Zampini         for (j = graph->cptr[i]; j < graph->cptr[i+1]; j++) {
2259c80a6c00SStefano Zampini           PetscInt k, size, *closure = NULL, cell = graph->queue[j];
2260c80a6c00SStefano Zampini 
2261c80a6c00SStefano Zampini           ierr = DMPlexGetTransitiveClosure(dm,cell,PETSC_TRUE,&size,&closure);CHKERRQ(ierr);
2262c80a6c00SStefano Zampini           for (k = 0; k < 2*size; k += 2) {
2263c80a6c00SStefano Zampini             PetscInt s, p = closure[k], off, dof, cdof;
2264c80a6c00SStefano Zampini 
2265c80a6c00SStefano Zampini             ierr = PetscSectionGetConstraintDof(subSection, p, &cdof);CHKERRQ(ierr);
2266c80a6c00SStefano Zampini             ierr = PetscSectionGetOffset(subSection,p,&off);CHKERRQ(ierr);
2267c80a6c00SStefano Zampini             ierr = PetscSectionGetDof(subSection,p,&dof);CHKERRQ(ierr);
2268c80a6c00SStefano Zampini             for (s = 0; s < dof-cdof; s++) {
2269c80a6c00SStefano Zampini               if (PetscBTLookupSet(btvt,off+s)) continue;
2270c80a6c00SStefano Zampini               if (!PetscBTLookup(btv,off+s)) {
2271c80a6c00SStefano Zampini                 ids[cum++] = off+s;
2272c80a6c00SStefano Zampini               } else { /* cross-vertex */
2273c80a6c00SStefano Zampini                 pids[cump++] = off+s;
2274c80a6c00SStefano Zampini               }
2275c80a6c00SStefano Zampini             }
2276c80a6c00SStefano Zampini           }
2277c80a6c00SStefano Zampini           ierr = DMPlexRestoreTransitiveClosure(dm,cell,PETSC_TRUE,&size,&closure);CHKERRQ(ierr);
2278c80a6c00SStefano Zampini         }
2279c80a6c00SStefano Zampini         cids[i+1] = cum;
2280c80a6c00SStefano Zampini         /* mark dofs as already assigned */
2281c80a6c00SStefano Zampini         for (j = cids[i]; j < cids[i+1]; j++) {
2282c80a6c00SStefano Zampini           ierr = PetscBTSet(btv,ids[j]);CHKERRQ(ierr);
2283c80a6c00SStefano Zampini         }
2284c80a6c00SStefano Zampini       }
2285c80a6c00SStefano Zampini       if (cc) {
2286c80a6c00SStefano Zampini         ierr = PetscMalloc1(graph->ncc,&cc_n);CHKERRQ(ierr);
2287c80a6c00SStefano Zampini         for (i = 0; i < graph->ncc; i++) {
2288c80a6c00SStefano Zampini           ierr = ISCreateGeneral(PETSC_COMM_SELF,cids[i+1]-cids[i],ids+cids[i],PETSC_COPY_VALUES,&cc_n[i]);CHKERRQ(ierr);
2289c80a6c00SStefano Zampini         }
2290c80a6c00SStefano Zampini         *cc = cc_n;
2291c80a6c00SStefano Zampini       }
2292c80a6c00SStefano Zampini       if (primalv) {
2293c80a6c00SStefano Zampini         ierr = ISCreateGeneral(PetscObjectComm((PetscObject)pc),cump,pids,PETSC_COPY_VALUES,primalv);CHKERRQ(ierr);
2294c80a6c00SStefano Zampini       }
2295c80a6c00SStefano Zampini       ierr = PetscFree3(ids,cids,pids);CHKERRQ(ierr);
2296c80a6c00SStefano Zampini       ierr = PetscBTDestroy(&btv);CHKERRQ(ierr);
2297c80a6c00SStefano Zampini       ierr = PetscBTDestroy(&btvt);CHKERRQ(ierr);
2298c80a6c00SStefano Zampini     }
2299c80a6c00SStefano Zampini   } else {
23001cf9b237SStefano Zampini     if (ncc) *ncc = graph->ncc;
23011cf9b237SStefano Zampini     if (cc) {
23024f1b2e48SStefano Zampini       ierr = PetscMalloc1(graph->ncc,&cc_n);CHKERRQ(ierr);
23034f1b2e48SStefano Zampini       for (i=0;i<graph->ncc;i++) {
23044f1b2e48SStefano Zampini         ierr = ISCreateGeneral(PETSC_COMM_SELF,graph->cptr[i+1]-graph->cptr[i],graph->queue+graph->cptr[i],PETSC_COPY_VALUES,&cc_n[i]);CHKERRQ(ierr);
23054f1b2e48SStefano Zampini       }
23064f1b2e48SStefano Zampini       *cc = cc_n;
23071cf9b237SStefano Zampini     }
2308c80a6c00SStefano Zampini   }
23094f1b2e48SStefano Zampini   /* clean up graph */
23104f1b2e48SStefano Zampini   graph->xadj = 0;
23114f1b2e48SStefano Zampini   graph->adjncy = 0;
23124f1b2e48SStefano Zampini   ierr = PCBDDCGraphDestroy(&graph);CHKERRQ(ierr);
23134f1b2e48SStefano Zampini   PetscFunctionReturn(0);
23144f1b2e48SStefano Zampini }
23154f1b2e48SStefano Zampini 
23165408967cSStefano Zampini PetscErrorCode PCBDDCBenignCheck(PC pc, IS zerodiag)
23175408967cSStefano Zampini {
23185408967cSStefano Zampini   PC_BDDC*       pcbddc = (PC_BDDC*)pc->data;
23195408967cSStefano Zampini   PC_IS*         pcis = (PC_IS*)(pc->data);
2320dee84bffSStefano Zampini   IS             dirIS = NULL;
23214f1b2e48SStefano Zampini   PetscInt       i;
23225408967cSStefano Zampini   PetscErrorCode ierr;
23235408967cSStefano Zampini 
23245408967cSStefano Zampini   PetscFunctionBegin;
2325dee84bffSStefano Zampini   ierr = PCBDDCGraphGetDirichletDofs(pcbddc->mat_graph,&dirIS);CHKERRQ(ierr);
23265408967cSStefano Zampini   if (zerodiag) {
23275408967cSStefano Zampini     Mat            A;
23285408967cSStefano Zampini     Vec            vec3_N;
23295408967cSStefano Zampini     PetscScalar    *vals;
23305408967cSStefano Zampini     const PetscInt *idxs;
2331d12d3064SStefano Zampini     PetscInt       nz,*count;
23325408967cSStefano Zampini 
23335408967cSStefano Zampini     /* p0 */
23345408967cSStefano Zampini     ierr = VecSet(pcis->vec1_N,0.);CHKERRQ(ierr);
23355408967cSStefano Zampini     ierr = PetscMalloc1(pcis->n,&vals);CHKERRQ(ierr);
23365408967cSStefano Zampini     ierr = ISGetLocalSize(zerodiag,&nz);CHKERRQ(ierr);
23375408967cSStefano Zampini     ierr = ISGetIndices(zerodiag,&idxs);CHKERRQ(ierr);
23384f1b2e48SStefano Zampini     for (i=0;i<nz;i++) vals[i] = 1.;
23395408967cSStefano Zampini     ierr = VecSetValues(pcis->vec1_N,nz,idxs,vals,INSERT_VALUES);CHKERRQ(ierr);
23405408967cSStefano Zampini     ierr = VecAssemblyBegin(pcis->vec1_N);CHKERRQ(ierr);
23415408967cSStefano Zampini     ierr = VecAssemblyEnd(pcis->vec1_N);CHKERRQ(ierr);
23425408967cSStefano Zampini     /* v_I */
23435408967cSStefano Zampini     ierr = VecSetRandom(pcis->vec2_N,NULL);CHKERRQ(ierr);
23445408967cSStefano Zampini     for (i=0;i<nz;i++) vals[i] = 0.;
23455408967cSStefano Zampini     ierr = VecSetValues(pcis->vec2_N,nz,idxs,vals,INSERT_VALUES);CHKERRQ(ierr);
23465408967cSStefano Zampini     ierr = ISRestoreIndices(zerodiag,&idxs);CHKERRQ(ierr);
23475408967cSStefano Zampini     ierr = ISGetIndices(pcis->is_B_local,&idxs);CHKERRQ(ierr);
23485408967cSStefano Zampini     for (i=0;i<pcis->n_B;i++) vals[i] = 0.;
23495408967cSStefano Zampini     ierr = VecSetValues(pcis->vec2_N,pcis->n_B,idxs,vals,INSERT_VALUES);CHKERRQ(ierr);
23505408967cSStefano Zampini     ierr = ISRestoreIndices(pcis->is_B_local,&idxs);CHKERRQ(ierr);
23515408967cSStefano Zampini     if (dirIS) {
23525408967cSStefano Zampini       PetscInt n;
23535408967cSStefano Zampini 
23545408967cSStefano Zampini       ierr = ISGetLocalSize(dirIS,&n);CHKERRQ(ierr);
23555408967cSStefano Zampini       ierr = ISGetIndices(dirIS,&idxs);CHKERRQ(ierr);
23565408967cSStefano Zampini       for (i=0;i<n;i++) vals[i] = 0.;
23575408967cSStefano Zampini       ierr = VecSetValues(pcis->vec2_N,n,idxs,vals,INSERT_VALUES);CHKERRQ(ierr);
23585408967cSStefano Zampini       ierr = ISRestoreIndices(dirIS,&idxs);CHKERRQ(ierr);
23595408967cSStefano Zampini     }
23605408967cSStefano Zampini     ierr = VecAssemblyBegin(pcis->vec2_N);CHKERRQ(ierr);
23615408967cSStefano Zampini     ierr = VecAssemblyEnd(pcis->vec2_N);CHKERRQ(ierr);
23625408967cSStefano Zampini     ierr = VecDuplicate(pcis->vec1_N,&vec3_N);CHKERRQ(ierr);
23635408967cSStefano Zampini     ierr = VecSet(vec3_N,0.);CHKERRQ(ierr);
2364669cc0f4SStefano Zampini     ierr = MatISGetLocalMat(pc->pmat,&A);CHKERRQ(ierr);
23655408967cSStefano Zampini     ierr = MatMult(A,pcis->vec1_N,vec3_N);CHKERRQ(ierr);
23665408967cSStefano Zampini     ierr = VecDot(vec3_N,pcis->vec2_N,&vals[0]);CHKERRQ(ierr);
23679a962809SStefano Zampini     if (PetscAbsScalar(vals[0]) > 1.e-1) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_SUP,"Benign trick can not be applied! b(v_I,p_0) = %1.6e (should be numerically 0.)",PetscAbsScalar(vals[0]));
23685408967cSStefano Zampini     ierr = PetscFree(vals);CHKERRQ(ierr);
23695408967cSStefano Zampini     ierr = VecDestroy(&vec3_N);CHKERRQ(ierr);
2370d12d3064SStefano Zampini 
2371d12d3064SStefano Zampini     /* there should not be any pressure dofs lying on the interface */
2372d12d3064SStefano Zampini     ierr = PetscCalloc1(pcis->n,&count);CHKERRQ(ierr);
2373d12d3064SStefano Zampini     ierr = ISGetIndices(pcis->is_B_local,&idxs);CHKERRQ(ierr);
2374d12d3064SStefano Zampini     for (i=0;i<pcis->n_B;i++) count[idxs[i]]++;
2375d12d3064SStefano Zampini     ierr = ISRestoreIndices(pcis->is_B_local,&idxs);CHKERRQ(ierr);
2376d12d3064SStefano Zampini     ierr = ISGetIndices(zerodiag,&idxs);CHKERRQ(ierr);
23779a962809SStefano Zampini     for (i=0;i<nz;i++) if (count[idxs[i]]) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_SUP,"Benign trick can not be applied! pressure dof %d is an interface dof",idxs[i]);
2378d12d3064SStefano Zampini     ierr = ISRestoreIndices(zerodiag,&idxs);CHKERRQ(ierr);
2379d12d3064SStefano Zampini     ierr = PetscFree(count);CHKERRQ(ierr);
23805408967cSStefano Zampini   }
2381dee84bffSStefano Zampini   ierr = ISDestroy(&dirIS);CHKERRQ(ierr);
23825408967cSStefano Zampini 
23835408967cSStefano Zampini   /* check PCBDDCBenignGetOrSetP0 */
23845408967cSStefano Zampini   ierr = VecSetRandom(pcis->vec1_global,NULL);CHKERRQ(ierr);
23854f1b2e48SStefano Zampini   for (i=0;i<pcbddc->benign_n;i++) pcbddc->benign_p0[i] = -PetscGlobalRank-i;
23865408967cSStefano Zampini   ierr = PCBDDCBenignGetOrSetP0(pc,pcis->vec1_global,PETSC_FALSE);CHKERRQ(ierr);
23874f1b2e48SStefano Zampini   for (i=0;i<pcbddc->benign_n;i++) pcbddc->benign_p0[i] = 1;
23885408967cSStefano Zampini   ierr = PCBDDCBenignGetOrSetP0(pc,pcis->vec1_global,PETSC_TRUE);CHKERRQ(ierr);
2389f2a566d8SStefano Zampini   for (i=0;i<pcbddc->benign_n;i++) {
2390f2a566d8SStefano Zampini     PetscInt val = PetscRealPart(pcbddc->benign_p0[i]);
239113903a91SSatish Balay     if (val != -PetscGlobalRank-i) SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Error testing PCBDDCBenignGetOrSetP0! Found %g at %d instead of %g\n",PetscRealPart(pcbddc->benign_p0[i]),i,-PetscGlobalRank-i);
2392f2a566d8SStefano Zampini   }
23935408967cSStefano Zampini   PetscFunctionReturn(0);
23945408967cSStefano Zampini }
23955408967cSStefano Zampini 
2396339f8db1SStefano Zampini PetscErrorCode PCBDDCBenignDetectSaddlePoint(PC pc, IS *zerodiaglocal)
2397339f8db1SStefano Zampini {
2398339f8db1SStefano Zampini   PC_BDDC*       pcbddc = (PC_BDDC*)pc->data;
23994edc6404Sstefano_zampini   IS             pressures,zerodiag,zerodiag_save,*zerodiag_subs;
2400b0f5fe93SStefano Zampini   PetscInt       nz,n;
24014edc6404Sstefano_zampini   PetscInt       *interior_dofs,n_interior_dofs,nneu;
24024edc6404Sstefano_zampini   PetscBool      sorted,have_null,has_null_pressures,recompute_zerodiag,checkb;
2403339f8db1SStefano Zampini   PetscErrorCode ierr;
2404339f8db1SStefano Zampini 
2405339f8db1SStefano Zampini   PetscFunctionBegin;
24069f47a83aSStefano Zampini   ierr = PetscSFDestroy(&pcbddc->benign_sf);CHKERRQ(ierr);
24079f47a83aSStefano Zampini   ierr = MatDestroy(&pcbddc->benign_B0);CHKERRQ(ierr);
2408a3df083aSStefano Zampini   for (n=0;n<pcbddc->benign_n;n++) {
2409a3df083aSStefano Zampini     ierr = ISDestroy(&pcbddc->benign_zerodiag_subs[n]);CHKERRQ(ierr);
2410a3df083aSStefano Zampini   }
2411a3df083aSStefano Zampini   ierr = PetscFree(pcbddc->benign_zerodiag_subs);CHKERRQ(ierr);
2412a3df083aSStefano Zampini   pcbddc->benign_n = 0;
241328b8efb1Sstefano_zampini 
241428b8efb1Sstefano_zampini   /* if a local info on dofs is present, uses the last field for "pressures" (or fid by command line)
24154f1b2e48SStefano Zampini      otherwise, it uses only zerodiagonal dofs (ok if the pressure block is all zero; it could fail if it is not)
24164f1b2e48SStefano Zampini      Checks if all the pressure dofs in each subdomain have a zero diagonal
24174f1b2e48SStefano Zampini      If not, a change of basis on pressures is not needed
24181ae86dd6SStefano Zampini      since the local Schur complements are already SPD
24194f1b2e48SStefano Zampini   */
24204f1b2e48SStefano Zampini   has_null_pressures = PETSC_TRUE;
24214f1b2e48SStefano Zampini   have_null = PETSC_TRUE;
242240fa8d13SStefano Zampini   if (pcbddc->n_ISForDofsLocal) {
24237fbe2174Sstefano_zampini     IS       iP = NULL;
24244f1b2e48SStefano Zampini     PetscInt npl,*idxs,p = pcbddc->n_ISForDofsLocal-1;
24254f1b2e48SStefano Zampini 
242628b8efb1Sstefano_zampini     ierr = PetscOptionsBegin(PetscObjectComm((PetscObject)pc),((PetscObject)pc)->prefix,"BDDC benign options","PC");CHKERRQ(ierr);
242728b8efb1Sstefano_zampini     ierr = PetscOptionsInt("-pc_bddc_pressure_field","Field id for pressures",NULL,p,&p,NULL);CHKERRQ(ierr);
242828b8efb1Sstefano_zampini     ierr = PetscOptionsEnd();CHKERRQ(ierr);
242928b8efb1Sstefano_zampini     if (p < 0 || p > pcbddc->n_ISForDofsLocal-1) SETERRQ1(PetscObjectComm((PetscObject)pc),PETSC_ERR_USER,"Invalid field id for pressures %D",p);
24304f1b2e48SStefano Zampini     /* Dofs splitting for BDDC cannot have PETSC_COMM_SELF, so create a sequential IS */
24314f1b2e48SStefano Zampini     ierr = ISGetLocalSize(pcbddc->ISForDofsLocal[p],&npl);CHKERRQ(ierr);
24324f1b2e48SStefano Zampini     ierr = ISGetIndices(pcbddc->ISForDofsLocal[p],(const PetscInt**)&idxs);CHKERRQ(ierr);
24334f1b2e48SStefano Zampini     ierr = ISCreateGeneral(PETSC_COMM_SELF,npl,idxs,PETSC_COPY_VALUES,&pressures);CHKERRQ(ierr);
2434ba14f8e3SStefano Zampini     ierr = ISRestoreIndices(pcbddc->ISForDofsLocal[p],(const PetscInt**)&idxs);CHKERRQ(ierr);
24357fbe2174Sstefano_zampini     /* remove zeroed out pressures if we are setting up a BDDC solver for a saddle-point FETI-DP */
24367fbe2174Sstefano_zampini     ierr = PetscObjectQuery((PetscObject)pc,"__KSPFETIDP_lP",(PetscObject*)&iP);CHKERRQ(ierr);
24377fbe2174Sstefano_zampini     if (iP) {
24387fbe2174Sstefano_zampini       IS newpressures;
24397fbe2174Sstefano_zampini 
24407fbe2174Sstefano_zampini       ierr = ISDifference(pressures,iP,&newpressures);CHKERRQ(ierr);
24417fbe2174Sstefano_zampini       ierr = ISDestroy(&pressures);CHKERRQ(ierr);
24427fbe2174Sstefano_zampini       pressures = newpressures;
24437fbe2174Sstefano_zampini     }
244440fa8d13SStefano Zampini     ierr = ISSorted(pressures,&sorted);CHKERRQ(ierr);
244540fa8d13SStefano Zampini     if (!sorted) {
244640fa8d13SStefano Zampini       ierr = ISSort(pressures);CHKERRQ(ierr);
244740fa8d13SStefano Zampini     }
244840fa8d13SStefano Zampini   } else {
244940fa8d13SStefano Zampini     pressures = NULL;
245040fa8d13SStefano Zampini   }
245197d764eeSStefano Zampini   /* pcis has not been setup yet, so get the local size from the subdomain matrix */
245297d764eeSStefano Zampini   ierr = MatGetLocalSize(pcbddc->local_mat,&n,NULL);CHKERRQ(ierr);
245327b6a85dSStefano Zampini   if (!n) pcbddc->benign_change_explicit = PETSC_TRUE;
245497d764eeSStefano Zampini   ierr = MatFindZeroDiagonals(pcbddc->local_mat,&zerodiag);CHKERRQ(ierr);
2455339f8db1SStefano Zampini   ierr = ISSorted(zerodiag,&sorted);CHKERRQ(ierr);
2456339f8db1SStefano Zampini   if (!sorted) {
2457339f8db1SStefano Zampini     ierr = ISSort(zerodiag);CHKERRQ(ierr);
2458339f8db1SStefano Zampini   }
24594edc6404Sstefano_zampini   ierr = PetscObjectReference((PetscObject)zerodiag);CHKERRQ(ierr);
24604edc6404Sstefano_zampini   zerodiag_save = zerodiag;
2461339f8db1SStefano Zampini   ierr = ISGetLocalSize(zerodiag,&nz);CHKERRQ(ierr);
24624f1b2e48SStefano Zampini   if (!nz) {
24634f1b2e48SStefano Zampini     if (n) have_null = PETSC_FALSE;
24644f1b2e48SStefano Zampini     has_null_pressures = PETSC_FALSE;
246540fa8d13SStefano Zampini     ierr = ISDestroy(&zerodiag);CHKERRQ(ierr);
246640fa8d13SStefano Zampini   }
24674f1b2e48SStefano Zampini   recompute_zerodiag = PETSC_FALSE;
24684f1b2e48SStefano Zampini   /* in case disconnected subdomains info is present, split the pressures accordingly (otherwise the benign trick could fail) */
24694f1b2e48SStefano Zampini   zerodiag_subs    = NULL;
24704f1b2e48SStefano Zampini   pcbddc->benign_n = 0;
24711f4df5f7SStefano Zampini   n_interior_dofs  = 0;
24721f4df5f7SStefano Zampini   interior_dofs    = NULL;
24734edc6404Sstefano_zampini   nneu             = 0;
24744edc6404Sstefano_zampini   if (pcbddc->NeumannBoundariesLocal) {
24754edc6404Sstefano_zampini     ierr = ISGetLocalSize(pcbddc->NeumannBoundariesLocal,&nneu);CHKERRQ(ierr);
24764edc6404Sstefano_zampini   }
24773369cb78Sstefano_zampini   checkb = (PetscBool)(!pcbddc->NeumannBoundariesLocal || pcbddc->current_level);
24784edc6404Sstefano_zampini   if (checkb) { /* need to compute interior nodes */
24791f4df5f7SStefano Zampini     PetscInt n,i,j;
24801f4df5f7SStefano Zampini     PetscInt n_neigh,*neigh,*n_shared,**shared;
24811f4df5f7SStefano Zampini     PetscInt *iwork;
24821f4df5f7SStefano Zampini 
24831f4df5f7SStefano Zampini     ierr = ISLocalToGlobalMappingGetSize(pc->pmat->rmap->mapping,&n);CHKERRQ(ierr);
24841f4df5f7SStefano Zampini     ierr = ISLocalToGlobalMappingGetInfo(pc->pmat->rmap->mapping,&n_neigh,&neigh,&n_shared,&shared);CHKERRQ(ierr);
24851f4df5f7SStefano Zampini     ierr = PetscCalloc1(n,&iwork);CHKERRQ(ierr);
24861f4df5f7SStefano Zampini     ierr = PetscMalloc1(n,&interior_dofs);CHKERRQ(ierr);
248790648384SStefano Zampini     for (i=1;i<n_neigh;i++)
24881f4df5f7SStefano Zampini       for (j=0;j<n_shared[i];j++)
24891f4df5f7SStefano Zampini           iwork[shared[i][j]] += 1;
24901f4df5f7SStefano Zampini     for (i=0;i<n;i++)
24911f4df5f7SStefano Zampini       if (!iwork[i])
24921f4df5f7SStefano Zampini         interior_dofs[n_interior_dofs++] = i;
24931f4df5f7SStefano Zampini     ierr = PetscFree(iwork);CHKERRQ(ierr);
24941f4df5f7SStefano Zampini     ierr = ISLocalToGlobalMappingRestoreInfo(pc->pmat->rmap->mapping,&n_neigh,&neigh,&n_shared,&shared);CHKERRQ(ierr);
24951f4df5f7SStefano Zampini   }
24964f1b2e48SStefano Zampini   if (has_null_pressures) {
24974f1b2e48SStefano Zampini     IS             *subs;
24984edc6404Sstefano_zampini     PetscInt       nsubs,i,j,nl;
24991f4df5f7SStefano Zampini     const PetscInt *idxs;
25001f4df5f7SStefano Zampini     PetscScalar    *array;
25011f4df5f7SStefano Zampini     Vec            *work;
25021f4df5f7SStefano Zampini     Mat_IS*        matis = (Mat_IS*)(pc->pmat->data);
25034f1b2e48SStefano Zampini 
25044f1b2e48SStefano Zampini     subs  = pcbddc->local_subs;
25054f1b2e48SStefano Zampini     nsubs = pcbddc->n_local_subs;
25061f4df5f7SStefano Zampini     /* these vectors are needed to check if the constant on pressures is in the kernel of the local operator B (i.e. B(v_I,p0) should be zero) */
25074edc6404Sstefano_zampini     if (checkb) {
25081f4df5f7SStefano Zampini       ierr = VecDuplicateVecs(matis->y,2,&work);CHKERRQ(ierr);
25091f4df5f7SStefano Zampini       ierr = ISGetLocalSize(zerodiag,&nl);CHKERRQ(ierr);
25101f4df5f7SStefano Zampini       ierr = ISGetIndices(zerodiag,&idxs);CHKERRQ(ierr);
25111f4df5f7SStefano Zampini       /* work[0] = 1_p */
25121f4df5f7SStefano Zampini       ierr = VecSet(work[0],0.);CHKERRQ(ierr);
25131f4df5f7SStefano Zampini       ierr = VecGetArray(work[0],&array);CHKERRQ(ierr);
25141f4df5f7SStefano Zampini       for (j=0;j<nl;j++) array[idxs[j]] = 1.;
25151f4df5f7SStefano Zampini       ierr = VecRestoreArray(work[0],&array);CHKERRQ(ierr);
25161f4df5f7SStefano Zampini       /* work[0] = 1_v */
25171f4df5f7SStefano Zampini       /* work[1] = 1_v */
25181f4df5f7SStefano Zampini       ierr = VecGetArray(work[1],&array);CHKERRQ(ierr);
25191f4df5f7SStefano Zampini       for (j=0;j<nl;j++) array[idxs[j]] = 0.;
25201f4df5f7SStefano Zampini       ierr = VecRestoreArray(work[1],&array);CHKERRQ(ierr);
25211f4df5f7SStefano Zampini       ierr = ISRestoreIndices(zerodiag,&idxs);CHKERRQ(ierr);
25221f4df5f7SStefano Zampini     }
25234f1b2e48SStefano Zampini     if (nsubs > 1) {
25244f1b2e48SStefano Zampini       ierr = PetscCalloc1(nsubs,&zerodiag_subs);CHKERRQ(ierr);
25254f1b2e48SStefano Zampini       for (i=0;i<nsubs;i++) {
25264f1b2e48SStefano Zampini         ISLocalToGlobalMapping l2g;
25274f1b2e48SStefano Zampini         IS                     t_zerodiag_subs;
25284f1b2e48SStefano Zampini         PetscInt               nl;
25294f1b2e48SStefano Zampini 
25304f1b2e48SStefano Zampini         ierr = ISLocalToGlobalMappingCreateIS(subs[i],&l2g);CHKERRQ(ierr);
25314f1b2e48SStefano Zampini         ierr = ISGlobalToLocalMappingApplyIS(l2g,IS_GTOLM_DROP,zerodiag,&t_zerodiag_subs);CHKERRQ(ierr);
25324f1b2e48SStefano Zampini         ierr = ISGetLocalSize(t_zerodiag_subs,&nl);CHKERRQ(ierr);
25334f1b2e48SStefano Zampini         if (nl) {
25344f1b2e48SStefano Zampini           PetscBool valid = PETSC_TRUE;
25354f1b2e48SStefano Zampini 
25364edc6404Sstefano_zampini           if (checkb) {
25371f4df5f7SStefano Zampini             ierr = VecSet(matis->x,0);CHKERRQ(ierr);
25381f4df5f7SStefano Zampini             ierr = ISGetLocalSize(subs[i],&nl);CHKERRQ(ierr);
25391f4df5f7SStefano Zampini             ierr = ISGetIndices(subs[i],&idxs);CHKERRQ(ierr);
25401f4df5f7SStefano Zampini             ierr = VecGetArray(matis->x,&array);CHKERRQ(ierr);
25411f4df5f7SStefano Zampini             for (j=0;j<nl;j++) array[idxs[j]] = 1.;
25421f4df5f7SStefano Zampini             ierr = VecRestoreArray(matis->x,&array);CHKERRQ(ierr);
25431f4df5f7SStefano Zampini             ierr = ISRestoreIndices(subs[i],&idxs);CHKERRQ(ierr);
25441f4df5f7SStefano Zampini             ierr = VecPointwiseMult(matis->x,work[0],matis->x);CHKERRQ(ierr);
25451f4df5f7SStefano Zampini             ierr = MatMult(matis->A,matis->x,matis->y);CHKERRQ(ierr);
25461f4df5f7SStefano Zampini             ierr = VecPointwiseMult(matis->y,work[1],matis->y);CHKERRQ(ierr);
25471f4df5f7SStefano Zampini             ierr = VecGetArray(matis->y,&array);CHKERRQ(ierr);
25481f4df5f7SStefano Zampini             for (j=0;j<n_interior_dofs;j++) {
25491f4df5f7SStefano Zampini               if (PetscAbsScalar(array[interior_dofs[j]]) > PETSC_SMALL) {
25501f4df5f7SStefano Zampini                 valid = PETSC_FALSE;
25511f4df5f7SStefano Zampini                 break;
25521f4df5f7SStefano Zampini               }
25531f4df5f7SStefano Zampini             }
25541f4df5f7SStefano Zampini             ierr = VecRestoreArray(matis->y,&array);CHKERRQ(ierr);
25551f4df5f7SStefano Zampini           }
25566632bad2Sstefano_zampini           if (valid && nneu) {
25576632bad2Sstefano_zampini             const PetscInt *idxs;
25581f4df5f7SStefano Zampini             PetscInt       nzb;
25591f4df5f7SStefano Zampini 
25606632bad2Sstefano_zampini             ierr = ISGetIndices(pcbddc->NeumannBoundariesLocal,&idxs);CHKERRQ(ierr);
25616632bad2Sstefano_zampini             ierr = ISGlobalToLocalMappingApply(l2g,IS_GTOLM_DROP,nneu,idxs,&nzb,NULL);CHKERRQ(ierr);
25626632bad2Sstefano_zampini             ierr = ISRestoreIndices(pcbddc->NeumannBoundariesLocal,&idxs);CHKERRQ(ierr);
25631f4df5f7SStefano Zampini             if (nzb) valid = PETSC_FALSE;
25641f4df5f7SStefano Zampini           }
25651f4df5f7SStefano Zampini           if (valid && pressures) {
25664f1b2e48SStefano Zampini             IS t_pressure_subs;
25674f1b2e48SStefano Zampini             ierr = ISGlobalToLocalMappingApplyIS(l2g,IS_GTOLM_DROP,pressures,&t_pressure_subs);CHKERRQ(ierr);
25684f1b2e48SStefano Zampini             ierr = ISEqual(t_pressure_subs,t_zerodiag_subs,&valid);CHKERRQ(ierr);
25694f1b2e48SStefano Zampini             ierr = ISDestroy(&t_pressure_subs);CHKERRQ(ierr);
25704f1b2e48SStefano Zampini           }
25714f1b2e48SStefano Zampini           if (valid) {
25724f1b2e48SStefano Zampini             ierr = ISLocalToGlobalMappingApplyIS(l2g,t_zerodiag_subs,&zerodiag_subs[pcbddc->benign_n]);CHKERRQ(ierr);
25734f1b2e48SStefano Zampini             pcbddc->benign_n++;
25744f1b2e48SStefano Zampini           } else {
25754f1b2e48SStefano Zampini             recompute_zerodiag = PETSC_TRUE;
25764f1b2e48SStefano Zampini           }
25774f1b2e48SStefano Zampini         }
25784f1b2e48SStefano Zampini         ierr = ISDestroy(&t_zerodiag_subs);CHKERRQ(ierr);
25794f1b2e48SStefano Zampini         ierr = ISLocalToGlobalMappingDestroy(&l2g);CHKERRQ(ierr);
25804f1b2e48SStefano Zampini       }
25814f1b2e48SStefano Zampini     } else { /* there's just one subdomain (or zero if they have not been detected */
25824f1b2e48SStefano Zampini       PetscBool valid = PETSC_TRUE;
25831f4df5f7SStefano Zampini 
25846632bad2Sstefano_zampini       if (nneu) valid = PETSC_FALSE;
25851f4df5f7SStefano Zampini       if (valid && pressures) {
25864f1b2e48SStefano Zampini         ierr = ISEqual(pressures,zerodiag,&valid);CHKERRQ(ierr);
25874f1b2e48SStefano Zampini       }
25884edc6404Sstefano_zampini       if (valid && checkb) {
25891f4df5f7SStefano Zampini         ierr = MatMult(matis->A,work[0],matis->x);CHKERRQ(ierr);
25901f4df5f7SStefano Zampini         ierr = VecPointwiseMult(matis->x,work[1],matis->x);CHKERRQ(ierr);
25911f4df5f7SStefano Zampini         ierr = VecGetArray(matis->x,&array);CHKERRQ(ierr);
25921f4df5f7SStefano Zampini         for (j=0;j<n_interior_dofs;j++) {
25931f4df5f7SStefano Zampini           if (PetscAbsScalar(array[interior_dofs[j]]) > PETSC_SMALL) {
25941f4df5f7SStefano Zampini             valid = PETSC_FALSE;
25951f4df5f7SStefano Zampini             break;
25961f4df5f7SStefano Zampini           }
25971f4df5f7SStefano Zampini         }
25981f4df5f7SStefano Zampini         ierr = VecRestoreArray(matis->x,&array);CHKERRQ(ierr);
25991f4df5f7SStefano Zampini       }
26004f1b2e48SStefano Zampini       if (valid) {
26014f1b2e48SStefano Zampini         pcbddc->benign_n = 1;
2602ca92afb2SStefano Zampini         ierr = PetscMalloc1(pcbddc->benign_n,&zerodiag_subs);CHKERRQ(ierr);
26034f1b2e48SStefano Zampini         ierr = PetscObjectReference((PetscObject)zerodiag);CHKERRQ(ierr);
26044f1b2e48SStefano Zampini         zerodiag_subs[0] = zerodiag;
26054f1b2e48SStefano Zampini       }
26064f1b2e48SStefano Zampini     }
26074edc6404Sstefano_zampini     if (checkb) {
26081f4df5f7SStefano Zampini       ierr = VecDestroyVecs(2,&work);CHKERRQ(ierr);
26094f1b2e48SStefano Zampini     }
26101f4df5f7SStefano Zampini   }
26111f4df5f7SStefano Zampini   ierr = PetscFree(interior_dofs);CHKERRQ(ierr);
26124f1b2e48SStefano Zampini 
26134f1b2e48SStefano Zampini   if (!pcbddc->benign_n) {
2614b9b0e38cSStefano Zampini     PetscInt n;
2615b9b0e38cSStefano Zampini 
26164f1b2e48SStefano Zampini     ierr = ISDestroy(&zerodiag);CHKERRQ(ierr);
26174f1b2e48SStefano Zampini     recompute_zerodiag = PETSC_FALSE;
2618b9b0e38cSStefano Zampini     ierr = MatGetLocalSize(pcbddc->local_mat,&n,NULL);CHKERRQ(ierr);
2619b9b0e38cSStefano Zampini     if (n) {
26204f1b2e48SStefano Zampini       has_null_pressures = PETSC_FALSE;
26214f1b2e48SStefano Zampini       have_null = PETSC_FALSE;
26224f1b2e48SStefano Zampini     }
2623b9b0e38cSStefano Zampini   }
26244f1b2e48SStefano Zampini 
26254f1b2e48SStefano Zampini   /* final check for null pressures */
26264f1b2e48SStefano Zampini   if (zerodiag && pressures) {
26274f1b2e48SStefano Zampini     PetscInt nz,np;
26284f1b2e48SStefano Zampini     ierr = ISGetLocalSize(zerodiag,&nz);CHKERRQ(ierr);
26294f1b2e48SStefano Zampini     ierr = ISGetLocalSize(pressures,&np);CHKERRQ(ierr);
26304f1b2e48SStefano Zampini     if (nz != np) have_null = PETSC_FALSE;
26314f1b2e48SStefano Zampini   }
26324f1b2e48SStefano Zampini 
26334f1b2e48SStefano Zampini   if (recompute_zerodiag) {
26344f1b2e48SStefano Zampini     ierr = ISDestroy(&zerodiag);CHKERRQ(ierr);
26354f1b2e48SStefano Zampini     if (pcbddc->benign_n == 1) {
26364f1b2e48SStefano Zampini       ierr = PetscObjectReference((PetscObject)zerodiag_subs[0]);CHKERRQ(ierr);
26374f1b2e48SStefano Zampini       zerodiag = zerodiag_subs[0];
26384f1b2e48SStefano Zampini     } else {
26394f1b2e48SStefano Zampini       PetscInt i,nzn,*new_idxs;
26404f1b2e48SStefano Zampini 
26414f1b2e48SStefano Zampini       nzn = 0;
26424f1b2e48SStefano Zampini       for (i=0;i<pcbddc->benign_n;i++) {
26434f1b2e48SStefano Zampini         PetscInt ns;
26444f1b2e48SStefano Zampini         ierr = ISGetLocalSize(zerodiag_subs[i],&ns);CHKERRQ(ierr);
26454f1b2e48SStefano Zampini         nzn += ns;
26464f1b2e48SStefano Zampini       }
26474f1b2e48SStefano Zampini       ierr = PetscMalloc1(nzn,&new_idxs);CHKERRQ(ierr);
26484f1b2e48SStefano Zampini       nzn = 0;
26494f1b2e48SStefano Zampini       for (i=0;i<pcbddc->benign_n;i++) {
26504f1b2e48SStefano Zampini         PetscInt ns,*idxs;
26514f1b2e48SStefano Zampini         ierr = ISGetLocalSize(zerodiag_subs[i],&ns);CHKERRQ(ierr);
26524f1b2e48SStefano Zampini         ierr = ISGetIndices(zerodiag_subs[i],(const PetscInt**)&idxs);CHKERRQ(ierr);
26534f1b2e48SStefano Zampini         ierr = PetscMemcpy(new_idxs+nzn,idxs,ns*sizeof(PetscInt));CHKERRQ(ierr);
26544f1b2e48SStefano Zampini         ierr = ISRestoreIndices(zerodiag_subs[i],(const PetscInt**)&idxs);CHKERRQ(ierr);
26554f1b2e48SStefano Zampini         nzn += ns;
26564f1b2e48SStefano Zampini       }
26574f1b2e48SStefano Zampini       ierr = PetscSortInt(nzn,new_idxs);CHKERRQ(ierr);
26584f1b2e48SStefano Zampini       ierr = ISCreateGeneral(PETSC_COMM_SELF,nzn,new_idxs,PETSC_OWN_POINTER,&zerodiag);CHKERRQ(ierr);
26594f1b2e48SStefano Zampini     }
26604f1b2e48SStefano Zampini     have_null = PETSC_FALSE;
26614f1b2e48SStefano Zampini   }
26624f1b2e48SStefano Zampini 
2663669cc0f4SStefano Zampini   /* Prepare matrix to compute no-net-flux */
2664a198735bSStefano Zampini   if (pcbddc->compute_nonetflux && !pcbddc->divudotp) {
2665a198735bSStefano Zampini     Mat                    A,loc_divudotp;
2666a198735bSStefano Zampini     ISLocalToGlobalMapping rl2g,cl2g,l2gmap;
2667a198735bSStefano Zampini     IS                     row,col,isused = NULL;
2668a198735bSStefano Zampini     PetscInt               M,N,n,st,n_isused;
2669a198735bSStefano Zampini 
26701f4df5f7SStefano Zampini     if (pressures) {
26711f4df5f7SStefano Zampini       isused = pressures;
26721f4df5f7SStefano Zampini     } else {
26734edc6404Sstefano_zampini       isused = zerodiag_save;
26741f4df5f7SStefano Zampini     }
2675a198735bSStefano Zampini     ierr = MatGetLocalToGlobalMapping(pc->pmat,&l2gmap,NULL);CHKERRQ(ierr);
2676669cc0f4SStefano Zampini     ierr = MatISGetLocalMat(pc->pmat,&A);CHKERRQ(ierr);
26771ae86dd6SStefano Zampini     ierr = MatGetLocalSize(A,&n,NULL);CHKERRQ(ierr);
26781ae86dd6SStefano Zampini     if (!isused && n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_USER,"Don't know how to extract div u dot p! Please provide the pressure field");
2679a198735bSStefano Zampini     n_isused = 0;
2680a198735bSStefano Zampini     if (isused) {
2681a198735bSStefano Zampini       ierr = ISGetLocalSize(isused,&n_isused);CHKERRQ(ierr);
2682a198735bSStefano Zampini     }
2683a198735bSStefano Zampini     ierr = MPI_Scan(&n_isused,&st,1,MPIU_INT,MPI_SUM,PetscObjectComm((PetscObject)pc));CHKERRQ(ierr);
2684a198735bSStefano Zampini     st = st-n_isused;
26851ae86dd6SStefano Zampini     if (n) {
2686a198735bSStefano Zampini       const PetscInt *gidxs;
2687a198735bSStefano Zampini 
26887dae84e0SHong Zhang       ierr = MatCreateSubMatrix(A,isused,NULL,MAT_INITIAL_MATRIX,&loc_divudotp);CHKERRQ(ierr);
2689a198735bSStefano Zampini       ierr = ISLocalToGlobalMappingGetIndices(l2gmap,&gidxs);CHKERRQ(ierr);
2690a198735bSStefano Zampini       /* TODO: extend ISCreateStride with st = PETSC_DECIDE */
2691a198735bSStefano Zampini       ierr = ISCreateStride(PetscObjectComm((PetscObject)pc),n_isused,st,1,&row);CHKERRQ(ierr);
2692a198735bSStefano Zampini       ierr = ISCreateGeneral(PetscObjectComm((PetscObject)pc),n,gidxs,PETSC_COPY_VALUES,&col);CHKERRQ(ierr);
2693a198735bSStefano Zampini       ierr = ISLocalToGlobalMappingRestoreIndices(l2gmap,&gidxs);CHKERRQ(ierr);
26941ae86dd6SStefano Zampini     } else {
2695a198735bSStefano Zampini       ierr = MatCreateSeqAIJ(PETSC_COMM_SELF,0,0,1,NULL,&loc_divudotp);CHKERRQ(ierr);
2696a198735bSStefano Zampini       ierr = ISCreateStride(PetscObjectComm((PetscObject)pc),n_isused,st,1,&row);CHKERRQ(ierr);
2697a198735bSStefano Zampini       ierr = ISCreateGeneral(PetscObjectComm((PetscObject)pc),0,NULL,PETSC_COPY_VALUES,&col);CHKERRQ(ierr);
2698a198735bSStefano Zampini     }
2699a198735bSStefano Zampini     ierr = MatGetSize(pc->pmat,NULL,&N);CHKERRQ(ierr);
2700a198735bSStefano Zampini     ierr = ISGetSize(row,&M);CHKERRQ(ierr);
2701a198735bSStefano Zampini     ierr = ISLocalToGlobalMappingCreateIS(row,&rl2g);CHKERRQ(ierr);
2702a198735bSStefano Zampini     ierr = ISLocalToGlobalMappingCreateIS(col,&cl2g);CHKERRQ(ierr);
2703a198735bSStefano Zampini     ierr = ISDestroy(&row);CHKERRQ(ierr);
2704a198735bSStefano Zampini     ierr = ISDestroy(&col);CHKERRQ(ierr);
2705a198735bSStefano Zampini     ierr = MatCreate(PetscObjectComm((PetscObject)pc),&pcbddc->divudotp);CHKERRQ(ierr);
2706a198735bSStefano Zampini     ierr = MatSetType(pcbddc->divudotp,MATIS);CHKERRQ(ierr);
2707a198735bSStefano Zampini     ierr = MatSetSizes(pcbddc->divudotp,PETSC_DECIDE,PETSC_DECIDE,M,N);CHKERRQ(ierr);
2708a198735bSStefano Zampini     ierr = MatSetLocalToGlobalMapping(pcbddc->divudotp,rl2g,cl2g);CHKERRQ(ierr);
2709a198735bSStefano Zampini     ierr = ISLocalToGlobalMappingDestroy(&rl2g);CHKERRQ(ierr);
2710a198735bSStefano Zampini     ierr = ISLocalToGlobalMappingDestroy(&cl2g);CHKERRQ(ierr);
2711a198735bSStefano Zampini     ierr = MatISSetLocalMat(pcbddc->divudotp,loc_divudotp);CHKERRQ(ierr);
2712a198735bSStefano Zampini     ierr = MatDestroy(&loc_divudotp);CHKERRQ(ierr);
27131ae86dd6SStefano Zampini     ierr = MatAssemblyBegin(pcbddc->divudotp,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
27141ae86dd6SStefano Zampini     ierr = MatAssemblyEnd(pcbddc->divudotp,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
27151ae86dd6SStefano Zampini   }
27164edc6404Sstefano_zampini   ierr = ISDestroy(&zerodiag_save);CHKERRQ(ierr);
2717b3afcdbeSStefano Zampini 
2718b3afcdbeSStefano Zampini   /* change of basis and p0 dofs */
27194f1b2e48SStefano Zampini   if (has_null_pressures) {
27204f1b2e48SStefano Zampini     IS             zerodiagc;
27214f1b2e48SStefano Zampini     const PetscInt *idxs,*idxsc;
27224f1b2e48SStefano Zampini     PetscInt       i,s,*nnz;
27234f1b2e48SStefano Zampini 
27244f1b2e48SStefano Zampini     ierr = ISGetLocalSize(zerodiag,&nz);CHKERRQ(ierr);
2725339f8db1SStefano Zampini     ierr = ISComplement(zerodiag,0,n,&zerodiagc);CHKERRQ(ierr);
2726339f8db1SStefano Zampini     ierr = ISGetIndices(zerodiagc,&idxsc);CHKERRQ(ierr);
2727339f8db1SStefano Zampini     /* local change of basis for pressures */
2728339f8db1SStefano Zampini     ierr = MatDestroy(&pcbddc->benign_change);CHKERRQ(ierr);
272997d764eeSStefano Zampini     ierr = MatCreate(PetscObjectComm((PetscObject)pcbddc->local_mat),&pcbddc->benign_change);CHKERRQ(ierr);
2730339f8db1SStefano Zampini     ierr = MatSetType(pcbddc->benign_change,MATAIJ);CHKERRQ(ierr);
2731339f8db1SStefano Zampini     ierr = MatSetSizes(pcbddc->benign_change,n,n,PETSC_DECIDE,PETSC_DECIDE);CHKERRQ(ierr);
2732339f8db1SStefano Zampini     ierr = PetscMalloc1(n,&nnz);CHKERRQ(ierr);
27334f1b2e48SStefano Zampini     for (i=0;i<n-nz;i++) nnz[idxsc[i]] = 1; /* identity on velocities plus pressure dofs for non-singular subdomains */
27344f1b2e48SStefano Zampini     for (i=0;i<pcbddc->benign_n;i++) {
27354f1b2e48SStefano Zampini       PetscInt nzs,j;
27364f1b2e48SStefano Zampini 
27374f1b2e48SStefano Zampini       ierr = ISGetLocalSize(zerodiag_subs[i],&nzs);CHKERRQ(ierr);
27384f1b2e48SStefano Zampini       ierr = ISGetIndices(zerodiag_subs[i],&idxs);CHKERRQ(ierr);
27394f1b2e48SStefano Zampini       for (j=0;j<nzs-1;j++) nnz[idxs[j]] = 2; /* change on pressures */
27404f1b2e48SStefano Zampini       nnz[idxs[nzs-1]] = nzs; /* last local pressure dof in subdomain */
27414f1b2e48SStefano Zampini       ierr = ISRestoreIndices(zerodiag_subs[i],&idxs);CHKERRQ(ierr);
27424f1b2e48SStefano Zampini     }
2743339f8db1SStefano Zampini     ierr = MatSeqAIJSetPreallocation(pcbddc->benign_change,0,nnz);CHKERRQ(ierr);
2744339f8db1SStefano Zampini     ierr = PetscFree(nnz);CHKERRQ(ierr);
2745339f8db1SStefano Zampini     /* set identity on velocities */
2746339f8db1SStefano Zampini     for (i=0;i<n-nz;i++) {
2747339f8db1SStefano Zampini       ierr = MatSetValue(pcbddc->benign_change,idxsc[i],idxsc[i],1.,INSERT_VALUES);CHKERRQ(ierr);
2748339f8db1SStefano Zampini     }
27494f1b2e48SStefano Zampini     ierr = ISRestoreIndices(zerodiagc,&idxsc);CHKERRQ(ierr);
27504f1b2e48SStefano Zampini     ierr = ISDestroy(&zerodiagc);CHKERRQ(ierr);
27519f47a83aSStefano Zampini     ierr = PetscFree3(pcbddc->benign_p0_lidx,pcbddc->benign_p0_gidx,pcbddc->benign_p0);CHKERRQ(ierr);
27524f1b2e48SStefano Zampini     ierr = PetscMalloc3(pcbddc->benign_n,&pcbddc->benign_p0_lidx,pcbddc->benign_n,&pcbddc->benign_p0_gidx,pcbddc->benign_n,&pcbddc->benign_p0);CHKERRQ(ierr);
2753339f8db1SStefano Zampini     /* set change on pressures */
27544f1b2e48SStefano Zampini     for (s=0;s<pcbddc->benign_n;s++) {
27554f1b2e48SStefano Zampini       PetscScalar *array;
27564f1b2e48SStefano Zampini       PetscInt    nzs;
27574f1b2e48SStefano Zampini 
27584f1b2e48SStefano Zampini       ierr = ISGetLocalSize(zerodiag_subs[s],&nzs);CHKERRQ(ierr);
27594f1b2e48SStefano Zampini       ierr = ISGetIndices(zerodiag_subs[s],&idxs);CHKERRQ(ierr);
27604f1b2e48SStefano Zampini       for (i=0;i<nzs-1;i++) {
2761339f8db1SStefano Zampini         PetscScalar vals[2];
2762339f8db1SStefano Zampini         PetscInt    cols[2];
2763339f8db1SStefano Zampini 
2764339f8db1SStefano Zampini         cols[0] = idxs[i];
27654f1b2e48SStefano Zampini         cols[1] = idxs[nzs-1];
2766339f8db1SStefano Zampini         vals[0] = 1.;
2767b0f5fe93SStefano Zampini         vals[1] = 1.;
27684f1b2e48SStefano Zampini         ierr = MatSetValues(pcbddc->benign_change,1,cols,2,cols,vals,INSERT_VALUES);CHKERRQ(ierr);
2769339f8db1SStefano Zampini       }
27704f1b2e48SStefano Zampini       ierr = PetscMalloc1(nzs,&array);CHKERRQ(ierr);
27714f1b2e48SStefano Zampini       for (i=0;i<nzs-1;i++) array[i] = -1.;
27724f1b2e48SStefano Zampini       array[nzs-1] = 1.;
27734f1b2e48SStefano Zampini       ierr = MatSetValues(pcbddc->benign_change,1,idxs+nzs-1,nzs,idxs,array,INSERT_VALUES);CHKERRQ(ierr);
27744f1b2e48SStefano Zampini       /* store local idxs for p0 */
27754f1b2e48SStefano Zampini       pcbddc->benign_p0_lidx[s] = idxs[nzs-1];
27764f1b2e48SStefano Zampini       ierr = ISRestoreIndices(zerodiag_subs[s],&idxs);CHKERRQ(ierr);
2777339f8db1SStefano Zampini       ierr = PetscFree(array);CHKERRQ(ierr);
27784f1b2e48SStefano Zampini     }
2779339f8db1SStefano Zampini     ierr = MatAssemblyBegin(pcbddc->benign_change,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
2780339f8db1SStefano Zampini     ierr = MatAssemblyEnd(pcbddc->benign_change,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
2781a3df083aSStefano Zampini     /* project if needed */
2782a3df083aSStefano Zampini     if (pcbddc->benign_change_explicit) {
27831dd7afcfSStefano Zampini       Mat M;
27841dd7afcfSStefano Zampini 
27851dd7afcfSStefano Zampini       ierr = MatPtAP(pcbddc->local_mat,pcbddc->benign_change,MAT_INITIAL_MATRIX,2.0,&M);CHKERRQ(ierr);
2786339f8db1SStefano Zampini       ierr = MatDestroy(&pcbddc->local_mat);CHKERRQ(ierr);
27871dd7afcfSStefano Zampini       ierr = MatSeqAIJCompress(M,&pcbddc->local_mat);CHKERRQ(ierr);
27881dd7afcfSStefano Zampini       ierr = MatDestroy(&M);CHKERRQ(ierr);
2789a3df083aSStefano Zampini     }
27904f1b2e48SStefano Zampini     /* store global idxs for p0 */
27914f1b2e48SStefano Zampini     ierr = ISLocalToGlobalMappingApply(pc->pmat->rmap->mapping,pcbddc->benign_n,pcbddc->benign_p0_lidx,pcbddc->benign_p0_gidx);CHKERRQ(ierr);
2792339f8db1SStefano Zampini   }
2793ca92afb2SStefano Zampini   pcbddc->benign_zerodiag_subs = zerodiag_subs;
27944f1b2e48SStefano Zampini   ierr = ISDestroy(&pressures);CHKERRQ(ierr);
2795b0f5fe93SStefano Zampini 
2796b0f5fe93SStefano Zampini   /* determines if the coarse solver will be singular or not */
2797b0f5fe93SStefano Zampini   ierr = MPI_Allreduce(&have_null,&pcbddc->benign_null,1,MPIU_BOOL,MPI_LAND,PetscObjectComm((PetscObject)pc));CHKERRQ(ierr);
279827b6a85dSStefano Zampini   /* determines if the problem has subdomains with 0 pressure block */
279927b6a85dSStefano Zampini   ierr = MPI_Allreduce(&have_null,&pcbddc->benign_have_null,1,MPIU_BOOL,MPI_LOR,PetscObjectComm((PetscObject)pc));CHKERRQ(ierr);
2800339f8db1SStefano Zampini   *zerodiaglocal = zerodiag;
2801339f8db1SStefano Zampini   PetscFunctionReturn(0);
2802339f8db1SStefano Zampini }
2803339f8db1SStefano Zampini 
2804015636ebSStefano Zampini PetscErrorCode PCBDDCBenignGetOrSetP0(PC pc, Vec v, PetscBool get)
2805efc2fbd9SStefano Zampini {
2806efc2fbd9SStefano Zampini   PC_BDDC*       pcbddc = (PC_BDDC*)pc->data;
2807de9d7bd0SStefano Zampini   PetscScalar    *array;
2808efc2fbd9SStefano Zampini   PetscErrorCode ierr;
2809efc2fbd9SStefano Zampini 
2810efc2fbd9SStefano Zampini   PetscFunctionBegin;
2811efc2fbd9SStefano Zampini   if (!pcbddc->benign_sf) {
2812efc2fbd9SStefano Zampini     ierr = PetscSFCreate(PetscObjectComm((PetscObject)pc),&pcbddc->benign_sf);CHKERRQ(ierr);
28134f1b2e48SStefano Zampini     ierr = PetscSFSetGraphLayout(pcbddc->benign_sf,pc->pmat->rmap,pcbddc->benign_n,NULL,PETSC_OWN_POINTER,pcbddc->benign_p0_gidx);CHKERRQ(ierr);
2814efc2fbd9SStefano Zampini   }
2815de9d7bd0SStefano Zampini   if (get) {
2816efc2fbd9SStefano Zampini     ierr = VecGetArrayRead(v,(const PetscScalar**)&array);CHKERRQ(ierr);
28174f1b2e48SStefano Zampini     ierr = PetscSFBcastBegin(pcbddc->benign_sf,MPIU_SCALAR,array,pcbddc->benign_p0);CHKERRQ(ierr);
28184f1b2e48SStefano Zampini     ierr = PetscSFBcastEnd(pcbddc->benign_sf,MPIU_SCALAR,array,pcbddc->benign_p0);CHKERRQ(ierr);
2819efc2fbd9SStefano Zampini     ierr = VecRestoreArrayRead(v,(const PetscScalar**)&array);CHKERRQ(ierr);
2820de9d7bd0SStefano Zampini   } else {
2821de9d7bd0SStefano Zampini     ierr = VecGetArray(v,&array);CHKERRQ(ierr);
2822de9d7bd0SStefano Zampini     ierr = PetscSFReduceBegin(pcbddc->benign_sf,MPIU_SCALAR,pcbddc->benign_p0,array,MPIU_REPLACE);CHKERRQ(ierr);
2823de9d7bd0SStefano Zampini     ierr = PetscSFReduceEnd(pcbddc->benign_sf,MPIU_SCALAR,pcbddc->benign_p0,array,MPIU_REPLACE);CHKERRQ(ierr);
2824de9d7bd0SStefano Zampini     ierr = VecRestoreArray(v,&array);CHKERRQ(ierr);
2825efc2fbd9SStefano Zampini   }
2826efc2fbd9SStefano Zampini   PetscFunctionReturn(0);
2827efc2fbd9SStefano Zampini }
2828efc2fbd9SStefano Zampini 
2829c263805aSStefano Zampini PetscErrorCode PCBDDCBenignPopOrPushB0(PC pc, PetscBool pop)
2830c263805aSStefano Zampini {
2831c263805aSStefano Zampini   PC_BDDC*       pcbddc = (PC_BDDC*)pc->data;
2832c263805aSStefano Zampini   PetscErrorCode ierr;
2833c263805aSStefano Zampini 
2834c263805aSStefano Zampini   PetscFunctionBegin;
2835c263805aSStefano Zampini   /* TODO: add error checking
2836c263805aSStefano Zampini     - avoid nested pop (or push) calls.
2837c263805aSStefano Zampini     - cannot push before pop.
28381c604dc7SStefano Zampini     - cannot call this if pcbddc->local_mat is NULL
2839c263805aSStefano Zampini   */
28404f1b2e48SStefano Zampini   if (!pcbddc->benign_n) {
2841efc2fbd9SStefano Zampini     PetscFunctionReturn(0);
2842efc2fbd9SStefano Zampini   }
2843c263805aSStefano Zampini   if (pop) {
2844a3df083aSStefano Zampini     if (pcbddc->benign_change_explicit) {
28454f1b2e48SStefano Zampini       IS       is_p0;
28464f1b2e48SStefano Zampini       MatReuse reuse;
2847c263805aSStefano Zampini 
2848c263805aSStefano Zampini       /* extract B_0 */
28494f1b2e48SStefano Zampini       reuse = MAT_INITIAL_MATRIX;
28504f1b2e48SStefano Zampini       if (pcbddc->benign_B0) {
28514f1b2e48SStefano Zampini         reuse = MAT_REUSE_MATRIX;
28524f1b2e48SStefano Zampini       }
28534f1b2e48SStefano Zampini       ierr = ISCreateGeneral(PETSC_COMM_SELF,pcbddc->benign_n,pcbddc->benign_p0_lidx,PETSC_COPY_VALUES,&is_p0);CHKERRQ(ierr);
28547dae84e0SHong Zhang       ierr = MatCreateSubMatrix(pcbddc->local_mat,is_p0,NULL,reuse,&pcbddc->benign_B0);CHKERRQ(ierr);
2855c263805aSStefano Zampini       /* remove rows and cols from local problem */
2856c263805aSStefano Zampini       ierr = MatSetOption(pcbddc->local_mat,MAT_KEEP_NONZERO_PATTERN,PETSC_TRUE);CHKERRQ(ierr);
285797d764eeSStefano Zampini       ierr = MatSetOption(pcbddc->local_mat,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_FALSE);CHKERRQ(ierr);
28584f1b2e48SStefano Zampini       ierr = MatZeroRowsColumnsIS(pcbddc->local_mat,is_p0,1.0,NULL,NULL);CHKERRQ(ierr);
28594f1b2e48SStefano Zampini       ierr = ISDestroy(&is_p0);CHKERRQ(ierr);
2860a3df083aSStefano Zampini     } else {
2861a3df083aSStefano Zampini       Mat_IS      *matis = (Mat_IS*)pc->pmat->data;
2862a3df083aSStefano Zampini       PetscScalar *vals;
2863a3df083aSStefano Zampini       PetscInt    i,n,*idxs_ins;
2864a3df083aSStefano Zampini 
2865a3df083aSStefano Zampini       ierr = VecGetLocalSize(matis->y,&n);CHKERRQ(ierr);
2866a3df083aSStefano Zampini       ierr = PetscMalloc2(n,&idxs_ins,n,&vals);CHKERRQ(ierr);
2867a3df083aSStefano Zampini       if (!pcbddc->benign_B0) {
28680b5adadeSStefano Zampini         PetscInt *nnz;
2869a3df083aSStefano Zampini         ierr = MatCreate(PetscObjectComm((PetscObject)pcbddc->local_mat),&pcbddc->benign_B0);CHKERRQ(ierr);
2870a3df083aSStefano Zampini         ierr = MatSetType(pcbddc->benign_B0,MATAIJ);CHKERRQ(ierr);
2871a3df083aSStefano Zampini         ierr = MatSetSizes(pcbddc->benign_B0,pcbddc->benign_n,n,PETSC_DECIDE,PETSC_DECIDE);CHKERRQ(ierr);
2872331e053bSStefano Zampini         ierr = PetscMalloc1(pcbddc->benign_n,&nnz);CHKERRQ(ierr);
2873331e053bSStefano Zampini         for (i=0;i<pcbddc->benign_n;i++) {
2874331e053bSStefano Zampini           ierr = ISGetLocalSize(pcbddc->benign_zerodiag_subs[i],&nnz[i]);CHKERRQ(ierr);
2875331e053bSStefano Zampini           nnz[i] = n - nnz[i];
2876331e053bSStefano Zampini         }
2877331e053bSStefano Zampini         ierr = MatSeqAIJSetPreallocation(pcbddc->benign_B0,0,nnz);CHKERRQ(ierr);
2878331e053bSStefano Zampini         ierr = PetscFree(nnz);CHKERRQ(ierr);
2879331e053bSStefano Zampini       }
2880a3df083aSStefano Zampini 
2881a3df083aSStefano Zampini       for (i=0;i<pcbddc->benign_n;i++) {
2882a3df083aSStefano Zampini         PetscScalar *array;
2883a3df083aSStefano Zampini         PetscInt    *idxs,j,nz,cum;
2884a3df083aSStefano Zampini 
2885a3df083aSStefano Zampini         ierr = VecSet(matis->x,0.);CHKERRQ(ierr);
2886a3df083aSStefano Zampini         ierr = ISGetLocalSize(pcbddc->benign_zerodiag_subs[i],&nz);CHKERRQ(ierr);
2887a3df083aSStefano Zampini         ierr = ISGetIndices(pcbddc->benign_zerodiag_subs[i],(const PetscInt**)&idxs);CHKERRQ(ierr);
2888a3df083aSStefano Zampini         for (j=0;j<nz;j++) vals[j] = 1.;
2889a3df083aSStefano Zampini         ierr = VecSetValues(matis->x,nz,idxs,vals,INSERT_VALUES);CHKERRQ(ierr);
2890a3df083aSStefano Zampini         ierr = VecAssemblyBegin(matis->x);CHKERRQ(ierr);
2891a3df083aSStefano Zampini         ierr = VecAssemblyEnd(matis->x);CHKERRQ(ierr);
2892a3df083aSStefano Zampini         ierr = VecSet(matis->y,0.);CHKERRQ(ierr);
2893a3df083aSStefano Zampini         ierr = MatMult(matis->A,matis->x,matis->y);CHKERRQ(ierr);
2894a3df083aSStefano Zampini         ierr = VecGetArray(matis->y,&array);CHKERRQ(ierr);
2895a3df083aSStefano Zampini         cum = 0;
2896a3df083aSStefano Zampini         for (j=0;j<n;j++) {
289722db5ddcSStefano Zampini           if (PetscUnlikely(PetscAbsScalar(array[j]) > PETSC_SMALL)) {
2898a3df083aSStefano Zampini             vals[cum] = array[j];
2899a3df083aSStefano Zampini             idxs_ins[cum] = j;
2900a3df083aSStefano Zampini             cum++;
2901a3df083aSStefano Zampini           }
2902a3df083aSStefano Zampini         }
2903a3df083aSStefano Zampini         ierr = MatSetValues(pcbddc->benign_B0,1,&i,cum,idxs_ins,vals,INSERT_VALUES);CHKERRQ(ierr);
2904a3df083aSStefano Zampini         ierr = VecRestoreArray(matis->y,&array);CHKERRQ(ierr);
2905a3df083aSStefano Zampini         ierr = ISRestoreIndices(pcbddc->benign_zerodiag_subs[i],(const PetscInt**)&idxs);CHKERRQ(ierr);
2906a3df083aSStefano Zampini       }
2907a3df083aSStefano Zampini       ierr = MatAssemblyBegin(pcbddc->benign_B0,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
2908a3df083aSStefano Zampini       ierr = MatAssemblyEnd(pcbddc->benign_B0,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
2909a3df083aSStefano Zampini       ierr = PetscFree2(idxs_ins,vals);CHKERRQ(ierr);
2910a3df083aSStefano Zampini     }
2911c263805aSStefano Zampini   } else { /* push */
2912a3df083aSStefano Zampini     if (pcbddc->benign_change_explicit) {
29134f1b2e48SStefano Zampini       PetscInt i;
29144f1b2e48SStefano Zampini 
29154f1b2e48SStefano Zampini       for (i=0;i<pcbddc->benign_n;i++) {
29164f1b2e48SStefano Zampini         PetscScalar *B0_vals;
29174f1b2e48SStefano Zampini         PetscInt    *B0_cols,B0_ncol;
29184f1b2e48SStefano Zampini 
29194f1b2e48SStefano Zampini         ierr = MatGetRow(pcbddc->benign_B0,i,&B0_ncol,(const PetscInt**)&B0_cols,(const PetscScalar**)&B0_vals);CHKERRQ(ierr);
29204f1b2e48SStefano Zampini         ierr = MatSetValues(pcbddc->local_mat,1,pcbddc->benign_p0_lidx+i,B0_ncol,B0_cols,B0_vals,INSERT_VALUES);CHKERRQ(ierr);
29217b034428SStefano Zampini         ierr = MatSetValues(pcbddc->local_mat,B0_ncol,B0_cols,1,pcbddc->benign_p0_lidx+i,B0_vals,INSERT_VALUES);CHKERRQ(ierr);
29224f1b2e48SStefano Zampini         ierr = MatSetValue(pcbddc->local_mat,pcbddc->benign_p0_lidx[i],pcbddc->benign_p0_lidx[i],0.0,INSERT_VALUES);CHKERRQ(ierr);
29234f1b2e48SStefano Zampini         ierr = MatRestoreRow(pcbddc->benign_B0,i,&B0_ncol,(const PetscInt**)&B0_cols,(const PetscScalar**)&B0_vals);CHKERRQ(ierr);
29244f1b2e48SStefano Zampini       }
2925c263805aSStefano Zampini       ierr = MatAssemblyBegin(pcbddc->local_mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
2926c263805aSStefano Zampini       ierr = MatAssemblyEnd(pcbddc->local_mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
2927a3df083aSStefano Zampini     } else {
2928a3df083aSStefano Zampini       SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Cannot push B0!\n");
2929a3df083aSStefano Zampini     }
2930c263805aSStefano Zampini   }
2931c263805aSStefano Zampini   PetscFunctionReturn(0);
2932c263805aSStefano Zampini }
2933c263805aSStefano Zampini 
293408122e43SStefano Zampini PetscErrorCode PCBDDCAdaptiveSelection(PC pc)
2935b1b3d7a2SStefano Zampini {
2936b1b3d7a2SStefano Zampini   PC_BDDC*        pcbddc = (PC_BDDC*)pc->data;
293708122e43SStefano Zampini   PCBDDCSubSchurs sub_schurs = pcbddc->sub_schurs;
293808122e43SStefano Zampini   PetscBLASInt    B_dummyint,B_neigs,B_ierr,B_lwork;
293908122e43SStefano Zampini   PetscBLASInt    *B_iwork,*B_ifail;
294008122e43SStefano Zampini   PetscScalar     *work,lwork;
294108122e43SStefano Zampini   PetscScalar     *St,*S,*eigv;
294208122e43SStefano Zampini   PetscScalar     *Sarray,*Starray;
294308122e43SStefano Zampini   PetscReal       *eigs,thresh;
29441b968477SStefano Zampini   PetscInt        i,nmax,nmin,nv,cum,mss,cum2,cumarray,maxneigs;
2945f6f667cfSStefano Zampini   PetscBool       allocated_S_St;
294608122e43SStefano Zampini #if defined(PETSC_USE_COMPLEX)
294708122e43SStefano Zampini   PetscReal       *rwork;
294808122e43SStefano Zampini #endif
2949b1b3d7a2SStefano Zampini   PetscErrorCode  ierr;
2950b1b3d7a2SStefano Zampini 
2951b1b3d7a2SStefano Zampini   PetscFunctionBegin;
2952b334f244SStefano Zampini   if (!sub_schurs) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Adaptive selection of constraints requires SubSchurs data");
2953af25d912SStefano Zampini   if (!sub_schurs->schur_explicit) SETERRQ(PetscObjectComm((PetscObject)pc),PETSC_ERR_SUP,"Adaptive selection of constraints requires MUMPS and/or MKL_CPARDISO");
2954d750e150Sstefano_zampini   if (sub_schurs->n_subs && (!sub_schurs->is_hermitian || !sub_schurs->is_posdef)) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_SUP,"Adaptive selection not yet implemented for general matrix pencils (herm %d, posdef %d)\nRerun with -sub_schurs_hermitian 1 -sub_schurs_posdef 1 if the problem is SPD",sub_schurs->is_hermitian,sub_schurs->is_posdef);
295506a4e24aSStefano Zampini 
2956fd14bc51SStefano Zampini   if (pcbddc->dbg_flag) {
2957fd14bc51SStefano Zampini     ierr = PetscViewerFlush(pcbddc->dbg_viewer);CHKERRQ(ierr);
2958fd14bc51SStefano Zampini     ierr = PetscViewerASCIIPrintf(pcbddc->dbg_viewer,"--------------------------------------------------\n");CHKERRQ(ierr);
2959fd14bc51SStefano Zampini     ierr = PetscViewerASCIIPrintf(pcbddc->dbg_viewer,"Check adaptive selection of constraints\n");CHKERRQ(ierr);
29601575c14dSBarry Smith     ierr = PetscViewerASCIIPushSynchronized(pcbddc->dbg_viewer);CHKERRQ(ierr);
2961fd14bc51SStefano Zampini   }
2962fd14bc51SStefano Zampini 
2963e496cd5dSStefano Zampini   if (pcbddc->dbg_flag) {
2964e496cd5dSStefano Zampini     PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"Subdomain %04d cc %d (%d,%d).\n",PetscGlobalRank,sub_schurs->n_subs,sub_schurs->is_hermitian,sub_schurs->is_posdef);
2965e496cd5dSStefano Zampini   }
2966e496cd5dSStefano Zampini 
296708122e43SStefano Zampini   /* max size of subsets */
296808122e43SStefano Zampini   mss = 0;
296908122e43SStefano Zampini   for (i=0;i<sub_schurs->n_subs;i++) {
297008122e43SStefano Zampini     PetscInt subset_size;
2971862806e4SStefano Zampini 
297208122e43SStefano Zampini     ierr = ISGetLocalSize(sub_schurs->is_subs[i],&subset_size);CHKERRQ(ierr);
297308122e43SStefano Zampini     mss = PetscMax(mss,subset_size);
297408122e43SStefano Zampini   }
297508122e43SStefano Zampini 
297608122e43SStefano Zampini   /* min/max and threshold */
297708122e43SStefano Zampini   nmax = pcbddc->adaptive_nmax > 0 ? pcbddc->adaptive_nmax : mss;
2978f6f667cfSStefano Zampini   nmin = pcbddc->adaptive_nmin > 0 ? pcbddc->adaptive_nmin : 0;
297908122e43SStefano Zampini   nmax = PetscMax(nmin,nmax);
2980f6f667cfSStefano Zampini   allocated_S_St = PETSC_FALSE;
2981f6f667cfSStefano Zampini   if (nmin) {
2982f6f667cfSStefano Zampini     allocated_S_St = PETSC_TRUE;
2983f6f667cfSStefano Zampini   }
298408122e43SStefano Zampini 
298508122e43SStefano Zampini   /* allocate lapack workspace */
298608122e43SStefano Zampini   cum = cum2 = 0;
298708122e43SStefano Zampini   maxneigs = 0;
298808122e43SStefano Zampini   for (i=0;i<sub_schurs->n_subs;i++) {
298908122e43SStefano Zampini     PetscInt n,subset_size;
2990f6f667cfSStefano Zampini 
299108122e43SStefano Zampini     ierr = ISGetLocalSize(sub_schurs->is_subs[i],&subset_size);CHKERRQ(ierr);
299208122e43SStefano Zampini     n = PetscMin(subset_size,nmax);
29939162d606SStefano Zampini     cum += subset_size;
29949162d606SStefano Zampini     cum2 += subset_size*n;
299508122e43SStefano Zampini     maxneigs = PetscMax(maxneigs,n);
299608122e43SStefano Zampini   }
299708122e43SStefano Zampini   if (mss) {
29989ab7bb16SStefano Zampini     if (sub_schurs->is_hermitian && sub_schurs->is_posdef) {
299908122e43SStefano Zampini       PetscBLASInt B_itype = 1;
300008122e43SStefano Zampini       PetscBLASInt B_N = mss;
30014c6709b3SStefano Zampini       PetscReal    zero = 0.0;
30024c6709b3SStefano Zampini       PetscReal    eps = 0.0; /* dlamch? */
300308122e43SStefano Zampini 
300408122e43SStefano Zampini       B_lwork = -1;
300508122e43SStefano Zampini       S = NULL;
300608122e43SStefano Zampini       St = NULL;
3007a58a30b4SStefano Zampini       eigs = NULL;
3008a58a30b4SStefano Zampini       eigv = NULL;
3009a58a30b4SStefano Zampini       B_iwork = NULL;
3010a58a30b4SStefano Zampini       B_ifail = NULL;
3011d1710679SStefano Zampini #if defined(PETSC_USE_COMPLEX)
3012d1710679SStefano Zampini       rwork = NULL;
3013d1710679SStefano Zampini #endif
30148bec7fa6SStefano Zampini       thresh = 1.0;
301508122e43SStefano Zampini       ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr);
301608122e43SStefano Zampini #if defined(PETSC_USE_COMPLEX)
301708122e43SStefano Zampini       PetscStackCallBLAS("LAPACKsygvx",LAPACKsygvx_(&B_itype,"V","V","L",&B_N,St,&B_N,S,&B_N,&zero,&thresh,&B_dummyint,&B_dummyint,&eps,&B_neigs,eigs,eigv,&B_N,&lwork,&B_lwork,rwork,B_iwork,B_ifail,&B_ierr));
301808122e43SStefano Zampini #else
301908122e43SStefano Zampini       PetscStackCallBLAS("LAPACKsygvx",LAPACKsygvx_(&B_itype,"V","V","L",&B_N,St,&B_N,S,&B_N,&zero,&thresh,&B_dummyint,&B_dummyint,&eps,&B_neigs,eigs,eigv,&B_N,&lwork,&B_lwork,B_iwork,B_ifail,&B_ierr));
302008122e43SStefano Zampini #endif
302108122e43SStefano Zampini       if (B_ierr != 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in query to SYGVX Lapack routine %d",(int)B_ierr);
302208122e43SStefano Zampini       ierr = PetscFPTrapPop();CHKERRQ(ierr);
302308122e43SStefano Zampini     } else {
302408122e43SStefano Zampini         /* TODO */
302508122e43SStefano Zampini     }
302608122e43SStefano Zampini   } else {
302708122e43SStefano Zampini     lwork = 0;
302808122e43SStefano Zampini   }
302908122e43SStefano Zampini 
303008122e43SStefano Zampini   nv = 0;
3031d62866d3SStefano Zampini   if (sub_schurs->is_vertices && pcbddc->use_vertices) { /* complement set of active subsets, each entry is a vertex (boundary made by active subsets, vertices and dirichlet dofs) */
3032d62866d3SStefano Zampini     ierr = ISGetLocalSize(sub_schurs->is_vertices,&nv);CHKERRQ(ierr);
303308122e43SStefano Zampini   }
30344c6709b3SStefano Zampini   ierr = PetscBLASIntCast((PetscInt)PetscRealPart(lwork),&B_lwork);CHKERRQ(ierr);
3035f6f667cfSStefano Zampini   if (allocated_S_St) {
3036f6f667cfSStefano Zampini     ierr = PetscMalloc2(mss*mss,&S,mss*mss,&St);CHKERRQ(ierr);
3037f6f667cfSStefano Zampini   }
3038f6f667cfSStefano Zampini   ierr = PetscMalloc5(mss*mss,&eigv,mss,&eigs,B_lwork,&work,5*mss,&B_iwork,mss,&B_ifail);CHKERRQ(ierr);
303908122e43SStefano Zampini #if defined(PETSC_USE_COMPLEX)
304008122e43SStefano Zampini   ierr = PetscMalloc1(7*mss,&rwork);CHKERRQ(ierr);
304108122e43SStefano Zampini #endif
30429162d606SStefano Zampini   ierr = PetscMalloc5(nv+sub_schurs->n_subs,&pcbddc->adaptive_constraints_n,
30439162d606SStefano Zampini                       nv+sub_schurs->n_subs+1,&pcbddc->adaptive_constraints_idxs_ptr,
30449162d606SStefano Zampini                       nv+sub_schurs->n_subs+1,&pcbddc->adaptive_constraints_data_ptr,
304508122e43SStefano Zampini                       nv+cum,&pcbddc->adaptive_constraints_idxs,
30469162d606SStefano Zampini                       nv+cum2,&pcbddc->adaptive_constraints_data);CHKERRQ(ierr);
304708122e43SStefano Zampini   ierr = PetscMemzero(pcbddc->adaptive_constraints_n,(nv+sub_schurs->n_subs)*sizeof(PetscInt));CHKERRQ(ierr);
304808122e43SStefano Zampini 
304908122e43SStefano Zampini   maxneigs = 0;
305072b8c272SStefano Zampini   cum = cumarray = 0;
30519162d606SStefano Zampini   pcbddc->adaptive_constraints_idxs_ptr[0] = 0;
30529162d606SStefano Zampini   pcbddc->adaptive_constraints_data_ptr[0] = 0;
3053d62866d3SStefano Zampini   if (sub_schurs->is_vertices && pcbddc->use_vertices) {
305408122e43SStefano Zampini     const PetscInt *idxs;
305508122e43SStefano Zampini 
3056d62866d3SStefano Zampini     ierr = ISGetIndices(sub_schurs->is_vertices,&idxs);CHKERRQ(ierr);
305708122e43SStefano Zampini     for (cum=0;cum<nv;cum++) {
305808122e43SStefano Zampini       pcbddc->adaptive_constraints_n[cum] = 1;
305908122e43SStefano Zampini       pcbddc->adaptive_constraints_idxs[cum] = idxs[cum];
306008122e43SStefano Zampini       pcbddc->adaptive_constraints_data[cum] = 1.0;
30619162d606SStefano Zampini       pcbddc->adaptive_constraints_idxs_ptr[cum+1] = pcbddc->adaptive_constraints_idxs_ptr[cum]+1;
30629162d606SStefano Zampini       pcbddc->adaptive_constraints_data_ptr[cum+1] = pcbddc->adaptive_constraints_data_ptr[cum]+1;
306308122e43SStefano Zampini     }
3064d62866d3SStefano Zampini     ierr = ISRestoreIndices(sub_schurs->is_vertices,&idxs);CHKERRQ(ierr);
306508122e43SStefano Zampini   }
306608122e43SStefano Zampini 
306708122e43SStefano Zampini   if (mss) { /* multilevel */
306808122e43SStefano Zampini     ierr = MatSeqAIJGetArray(sub_schurs->sum_S_Ej_inv_all,&Sarray);CHKERRQ(ierr);
306908122e43SStefano Zampini     ierr = MatSeqAIJGetArray(sub_schurs->sum_S_Ej_tilda_all,&Starray);CHKERRQ(ierr);
307008122e43SStefano Zampini   }
307108122e43SStefano Zampini 
3072ffd830a3SStefano Zampini   thresh = pcbddc->adaptive_threshold;
307308122e43SStefano Zampini   for (i=0;i<sub_schurs->n_subs;i++) {
307408122e43SStefano Zampini     const PetscInt *idxs;
30759d54b7f4SStefano Zampini     PetscReal      upper,lower;
3076862806e4SStefano Zampini     PetscInt       j,subset_size,eigs_start = 0;
307708122e43SStefano Zampini     PetscBLASInt   B_N;
3078aff50787SStefano Zampini     PetscBool      same_data = PETSC_FALSE;
307908122e43SStefano Zampini 
30809d54b7f4SStefano Zampini     if (pcbddc->use_deluxe_scaling) {
30819d54b7f4SStefano Zampini       upper = PETSC_MAX_REAL;
30829d54b7f4SStefano Zampini       lower = thresh;
30839d54b7f4SStefano Zampini     } else {
30849d54b7f4SStefano Zampini       upper = 1./thresh;
30859d54b7f4SStefano Zampini       lower = 0.;
30869d54b7f4SStefano Zampini     }
3087862806e4SStefano Zampini     ierr = ISGetLocalSize(sub_schurs->is_subs[i],&subset_size);CHKERRQ(ierr);
3088ffd830a3SStefano Zampini     ierr = ISGetIndices(sub_schurs->is_subs[i],&idxs);CHKERRQ(ierr);
3089f6f667cfSStefano Zampini     ierr = PetscBLASIntCast(subset_size,&B_N);CHKERRQ(ierr);
3090f6f667cfSStefano Zampini     if (allocated_S_St) { /* S and S_t should be copied since we could need them later */
30919ab7bb16SStefano Zampini       if (sub_schurs->is_hermitian) {
3092aff50787SStefano Zampini         PetscInt j,k;
3093aff50787SStefano Zampini         if (sub_schurs->n_subs == 1) { /* zeroing memory to use PetscMemcmp later */
3094aff50787SStefano Zampini           ierr = PetscMemzero(S,subset_size*subset_size*sizeof(PetscScalar));CHKERRQ(ierr);
3095aff50787SStefano Zampini           ierr = PetscMemzero(St,subset_size*subset_size*sizeof(PetscScalar));CHKERRQ(ierr);
309608122e43SStefano Zampini         }
309708122e43SStefano Zampini         for (j=0;j<subset_size;j++) {
3098aff50787SStefano Zampini           for (k=j;k<subset_size;k++) {
3099aff50787SStefano Zampini             S [j*subset_size+k] = Sarray [cumarray+j*subset_size+k];
3100aff50787SStefano Zampini             St[j*subset_size+k] = Starray[cumarray+j*subset_size+k];
3101aff50787SStefano Zampini           }
310208122e43SStefano Zampini         }
310308122e43SStefano Zampini       } else {
310408122e43SStefano Zampini         ierr = PetscMemcpy(S,Sarray+cumarray,subset_size*subset_size*sizeof(PetscScalar));CHKERRQ(ierr);
310508122e43SStefano Zampini         ierr = PetscMemcpy(St,Starray+cumarray,subset_size*subset_size*sizeof(PetscScalar));CHKERRQ(ierr);
310608122e43SStefano Zampini       }
31078bec7fa6SStefano Zampini     } else {
3108f6f667cfSStefano Zampini       S = Sarray + cumarray;
3109f6f667cfSStefano Zampini       St = Starray + cumarray;
31108bec7fa6SStefano Zampini     }
3111aff50787SStefano Zampini     /* see if we can save some work */
3112b7ab4a40SStefano Zampini     if (sub_schurs->n_subs == 1 && pcbddc->use_deluxe_scaling) {
3113aff50787SStefano Zampini       ierr = PetscMemcmp(S,St,subset_size*subset_size*sizeof(PetscScalar),&same_data);CHKERRQ(ierr);
3114aff50787SStefano Zampini     }
3115aff50787SStefano Zampini 
3116b7ab4a40SStefano Zampini     if (same_data && !sub_schurs->change) { /* there's no need of constraints here */
3117aff50787SStefano Zampini       B_neigs = 0;
3118aff50787SStefano Zampini     } else {
31199ab7bb16SStefano Zampini       if (sub_schurs->is_hermitian && sub_schurs->is_posdef) {
312008122e43SStefano Zampini         PetscBLASInt B_itype = 1;
3121f6f667cfSStefano Zampini         PetscBLASInt B_IL, B_IU;
31224c6709b3SStefano Zampini         PetscReal    eps = -1.0; /* dlamch? */
31239552c7c7SStefano Zampini         PetscInt     nmin_s;
3124b7ab4a40SStefano Zampini         PetscBool    compute_range = PETSC_FALSE;
312508122e43SStefano Zampini 
3126fd14bc51SStefano Zampini         if (pcbddc->dbg_flag) {
3127eee23b56SStefano Zampini           PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"Computing for sub %d/%d size %d count %d fid %d.\n",i,sub_schurs->n_subs,subset_size,pcbddc->mat_graph->count[idxs[0]]+1,pcbddc->mat_graph->which_dof[idxs[0]]);
3128fd14bc51SStefano Zampini         }
3129d16cbb6bSStefano Zampini 
3130b7ab4a40SStefano Zampini         compute_range = PETSC_FALSE;
3131b7ab4a40SStefano Zampini         if (thresh > 1.+PETSC_SMALL && !same_data) {
3132b7ab4a40SStefano Zampini           compute_range = PETSC_TRUE;
3133b7ab4a40SStefano Zampini         }
3134b7ab4a40SStefano Zampini 
313508122e43SStefano Zampini         ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr);
3136b7ab4a40SStefano Zampini         if (compute_range) {
3137d16cbb6bSStefano Zampini 
3138d16cbb6bSStefano Zampini           /* ask for eigenvalues larger than thresh */
313908122e43SStefano Zampini #if defined(PETSC_USE_COMPLEX)
31409d54b7f4SStefano Zampini           PetscStackCallBLAS("LAPACKsygvx",LAPACKsygvx_(&B_itype,"V","V","L",&B_N,St,&B_N,S,&B_N,&lower,&upper,&B_IL,&B_IU,&eps,&B_neigs,eigs,eigv,&B_N,work,&B_lwork,rwork,B_iwork,B_ifail,&B_ierr));
314108122e43SStefano Zampini #else
31429d54b7f4SStefano Zampini           PetscStackCallBLAS("LAPACKsygvx",LAPACKsygvx_(&B_itype,"V","V","L",&B_N,St,&B_N,S,&B_N,&lower,&upper,&B_IL,&B_IU,&eps,&B_neigs,eigs,eigv,&B_N,work,&B_lwork,B_iwork,B_ifail,&B_ierr));
314308122e43SStefano Zampini #endif
3144b7ab4a40SStefano Zampini         } else if (!same_data) {
3145d16cbb6bSStefano Zampini           B_IU = PetscMax(1,PetscMin(B_N,nmax));
3146d16cbb6bSStefano Zampini           B_IL = 1;
3147d16cbb6bSStefano Zampini #if defined(PETSC_USE_COMPLEX)
31489d54b7f4SStefano Zampini           PetscStackCallBLAS("LAPACKsygvx",LAPACKsygvx_(&B_itype,"V","I","L",&B_N,St,&B_N,S,&B_N,&lower,&upper,&B_IL,&B_IU,&eps,&B_neigs,eigs,eigv,&B_N,work,&B_lwork,rwork,B_iwork,B_ifail,&B_ierr));
3149d16cbb6bSStefano Zampini #else
31509d54b7f4SStefano Zampini           PetscStackCallBLAS("LAPACKsygvx",LAPACKsygvx_(&B_itype,"V","I","L",&B_N,St,&B_N,S,&B_N,&lower,&upper,&B_IL,&B_IU,&eps,&B_neigs,eigs,eigv,&B_N,work,&B_lwork,B_iwork,B_ifail,&B_ierr));
3151d16cbb6bSStefano Zampini #endif
3152b03ebc13SStefano Zampini         } else { /* same_data is true, so just get the adaptive functional requested by the user */
3153b7ab4a40SStefano Zampini           PetscInt k;
3154b7ab4a40SStefano Zampini           if (!sub_schurs->change_primal_sub) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"This should not happen");
3155b7ab4a40SStefano Zampini           ierr = ISGetLocalSize(sub_schurs->change_primal_sub[i],&nmax);CHKERRQ(ierr);
3156b7ab4a40SStefano Zampini           ierr = PetscBLASIntCast(nmax,&B_neigs);CHKERRQ(ierr);
3157b7ab4a40SStefano Zampini           nmin = nmax;
3158b7ab4a40SStefano Zampini           ierr = PetscMemzero(eigv,subset_size*nmax*sizeof(PetscScalar));CHKERRQ(ierr);
3159b7ab4a40SStefano Zampini           for (k=0;k<nmax;k++) {
3160b7ab4a40SStefano Zampini             eigs[k] = 1./PETSC_SMALL;
3161b7ab4a40SStefano Zampini             eigv[k*(subset_size+1)] = 1.0;
3162b7ab4a40SStefano Zampini           }
3163d16cbb6bSStefano Zampini         }
316408122e43SStefano Zampini         ierr = PetscFPTrapPop();CHKERRQ(ierr);
316508122e43SStefano Zampini         if (B_ierr) {
31666c4ed002SBarry Smith           if (B_ierr < 0 ) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in SYGVX Lapack routine: illegal value for argument %d",-(int)B_ierr);
31676c4ed002SBarry Smith           else if (B_ierr <= B_N) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in SYGVX Lapack routine: %d eigenvalues failed to converge",(int)B_ierr);
31686c4ed002SBarry Smith           else SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in SYGVX Lapack routine: leading minor of order %d is not positive definite",(int)B_ierr-B_N-1);
316908122e43SStefano Zampini         }
317008122e43SStefano Zampini 
317108122e43SStefano Zampini         if (B_neigs > nmax) {
3172fd14bc51SStefano Zampini           if (pcbddc->dbg_flag) {
3173fd14bc51SStefano Zampini             PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"   found %d eigs, more than maximum required %d.\n",B_neigs,nmax);
3174fd14bc51SStefano Zampini           }
31759d54b7f4SStefano Zampini           if (pcbddc->use_deluxe_scaling) eigs_start = B_neigs -nmax;
317608122e43SStefano Zampini           B_neigs = nmax;
317708122e43SStefano Zampini         }
317808122e43SStefano Zampini 
31799552c7c7SStefano Zampini         nmin_s = PetscMin(nmin,B_N);
31809552c7c7SStefano Zampini         if (B_neigs < nmin_s) {
318108122e43SStefano Zampini           PetscBLASInt B_neigs2;
318208122e43SStefano Zampini 
31839d54b7f4SStefano Zampini           if (pcbddc->use_deluxe_scaling) {
3184f6f667cfSStefano Zampini             B_IL = B_N - nmin_s + 1;
31859d54b7f4SStefano Zampini             B_IU = B_N - B_neigs;
31869d54b7f4SStefano Zampini           } else {
31879d54b7f4SStefano Zampini             B_IL = B_neigs + 1;
31889d54b7f4SStefano Zampini             B_IU = nmin_s;
31899d54b7f4SStefano Zampini           }
3190fd14bc51SStefano Zampini           if (pcbddc->dbg_flag) {
3191fd14bc51SStefano Zampini             PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"   found %d eigs, less than minimum required %d. Asking for %d to %d incl (fortran like)\n",B_neigs,nmin,B_IL,B_IU);
3192fd14bc51SStefano Zampini           }
31939ab7bb16SStefano Zampini           if (sub_schurs->is_hermitian) {
31941ae86dd6SStefano Zampini             PetscInt j,k;
319508122e43SStefano Zampini             for (j=0;j<subset_size;j++) {
31961ae86dd6SStefano Zampini               for (k=j;k<subset_size;k++) {
31971ae86dd6SStefano Zampini                 S [j*subset_size+k] = Sarray [cumarray+j*subset_size+k];
31981ae86dd6SStefano Zampini                 St[j*subset_size+k] = Starray[cumarray+j*subset_size+k];
319908122e43SStefano Zampini               }
320008122e43SStefano Zampini             }
320108122e43SStefano Zampini           } else {
320208122e43SStefano Zampini             ierr = PetscMemcpy(S,Sarray+cumarray,subset_size*subset_size*sizeof(PetscScalar));CHKERRQ(ierr);
320308122e43SStefano Zampini             ierr = PetscMemcpy(St,Starray+cumarray,subset_size*subset_size*sizeof(PetscScalar));CHKERRQ(ierr);
320408122e43SStefano Zampini           }
320508122e43SStefano Zampini           ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr);
320608122e43SStefano Zampini #if defined(PETSC_USE_COMPLEX)
32079d54b7f4SStefano Zampini           PetscStackCallBLAS("LAPACKsygvx",LAPACKsygvx_(&B_itype,"V","I","L",&B_N,St,&B_N,S,&B_N,&lower,&upper,&B_IL,&B_IU,&eps,&B_neigs2,eigs+B_neigs,eigv+B_neigs*subset_size,&B_N,work,&B_lwork,rwork,B_iwork,B_ifail,&B_ierr));
320808122e43SStefano Zampini #else
32099d54b7f4SStefano Zampini           PetscStackCallBLAS("LAPACKsygvx",LAPACKsygvx_(&B_itype,"V","I","L",&B_N,St,&B_N,S,&B_N,&lower,&upper,&B_IL,&B_IU,&eps,&B_neigs2,eigs+B_neigs,eigv+B_neigs*subset_size,&B_N,work,&B_lwork,B_iwork,B_ifail,&B_ierr));
321008122e43SStefano Zampini #endif
321108122e43SStefano Zampini           ierr = PetscFPTrapPop();CHKERRQ(ierr);
321208122e43SStefano Zampini           B_neigs += B_neigs2;
321308122e43SStefano Zampini         }
321408122e43SStefano Zampini         if (B_ierr) {
32156c4ed002SBarry Smith           if (B_ierr < 0 ) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in SYGVX Lapack routine: illegal value for argument %d",-(int)B_ierr);
32166c4ed002SBarry Smith           else if (B_ierr <= B_N) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in SYGVX Lapack routine: %d eigenvalues failed to converge",(int)B_ierr);
32176c4ed002SBarry Smith           else SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in SYGVX Lapack routine: leading minor of order %d is not positive definite",(int)B_ierr-B_N-1);
321808122e43SStefano Zampini         }
3219fd14bc51SStefano Zampini         if (pcbddc->dbg_flag) {
3220ac47001eSStefano Zampini           ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"   -> Got %d eigs\n",B_neigs);CHKERRQ(ierr);
322108122e43SStefano Zampini           for (j=0;j<B_neigs;j++) {
322208122e43SStefano Zampini             if (eigs[j] == 0.0) {
3223ac47001eSStefano Zampini               ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"     Inf\n");CHKERRQ(ierr);
322408122e43SStefano Zampini             } else {
32259d54b7f4SStefano Zampini               if (pcbddc->use_deluxe_scaling) {
3226ac47001eSStefano Zampini                 ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"     %1.6e\n",eigs[j+eigs_start]);CHKERRQ(ierr);
32279d54b7f4SStefano Zampini               } else {
32289d54b7f4SStefano Zampini                 ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"     %1.6e\n",1./eigs[j+eigs_start]);CHKERRQ(ierr);
32299d54b7f4SStefano Zampini               }
3230fd14bc51SStefano Zampini             }
323108122e43SStefano Zampini           }
323208122e43SStefano Zampini         }
323308122e43SStefano Zampini       } else {
323408122e43SStefano Zampini           /* TODO */
323508122e43SStefano Zampini       }
3236aff50787SStefano Zampini     }
32376c3e6151SStefano Zampini     /* change the basis back to the original one */
32386c3e6151SStefano Zampini     if (sub_schurs->change) {
323972b8c272SStefano Zampini       Mat change,phi,phit;
32406c3e6151SStefano Zampini 
32416c3e6151SStefano Zampini       if (pcbddc->dbg_flag > 1) {
32426c3e6151SStefano Zampini         PetscInt ii;
32436c3e6151SStefano Zampini         for (ii=0;ii<B_neigs;ii++) {
32446c3e6151SStefano Zampini           ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"   -> Eigenvector (old basis) %d/%d (%d)\n",ii,B_neigs,B_N);CHKERRQ(ierr);
32456c3e6151SStefano Zampini           for (j=0;j<B_N;j++) {
3246684229deSStefano Zampini #if defined(PETSC_USE_COMPLEX)
3247684229deSStefano Zampini             PetscReal r = PetscRealPart(eigv[(ii+eigs_start)*subset_size+j]);
3248684229deSStefano Zampini             PetscReal c = PetscImaginaryPart(eigv[(ii+eigs_start)*subset_size+j]);
3249684229deSStefano Zampini             ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"       %1.4e + %1.4e i\n",r,c);CHKERRQ(ierr);
3250684229deSStefano Zampini #else
32516c3e6151SStefano Zampini             ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"       %1.4e\n",eigv[(ii+eigs_start)*subset_size+j]);CHKERRQ(ierr);
3252684229deSStefano Zampini #endif
32536c3e6151SStefano Zampini           }
32546c3e6151SStefano Zampini         }
32556c3e6151SStefano Zampini       }
325672b8c272SStefano Zampini       ierr = KSPGetOperators(sub_schurs->change[i],&change,NULL);CHKERRQ(ierr);
32576c3e6151SStefano Zampini       ierr = MatCreateSeqDense(PETSC_COMM_SELF,subset_size,B_neigs,eigv+eigs_start*subset_size,&phit);CHKERRQ(ierr);
325872b8c272SStefano Zampini       ierr = MatMatMult(change,phit,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&phi);CHKERRQ(ierr);
32596c3e6151SStefano Zampini       ierr = MatCopy(phi,phit,SAME_NONZERO_PATTERN);CHKERRQ(ierr);
32606c3e6151SStefano Zampini       ierr = MatDestroy(&phit);CHKERRQ(ierr);
32616c3e6151SStefano Zampini       ierr = MatDestroy(&phi);CHKERRQ(ierr);
32626c3e6151SStefano Zampini     }
32638bec7fa6SStefano Zampini     maxneigs = PetscMax(B_neigs,maxneigs);
32648bec7fa6SStefano Zampini     pcbddc->adaptive_constraints_n[i+nv] = B_neigs;
32659162d606SStefano Zampini     if (B_neigs) {
32669162d606SStefano Zampini       ierr = PetscMemcpy(pcbddc->adaptive_constraints_data+pcbddc->adaptive_constraints_data_ptr[cum],eigv+eigs_start*subset_size,B_neigs*subset_size*sizeof(PetscScalar));CHKERRQ(ierr);
3267fd14bc51SStefano Zampini 
3268fd14bc51SStefano Zampini       if (pcbddc->dbg_flag > 1) {
32699552c7c7SStefano Zampini         PetscInt ii;
32709552c7c7SStefano Zampini         for (ii=0;ii<B_neigs;ii++) {
3271ac47001eSStefano Zampini           ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"   -> Eigenvector %d/%d (%d)\n",ii,B_neigs,B_N);CHKERRQ(ierr);
32729552c7c7SStefano Zampini           for (j=0;j<B_N;j++) {
3273ac47001eSStefano Zampini #if defined(PETSC_USE_COMPLEX)
3274ac47001eSStefano Zampini             PetscReal r = PetscRealPart(pcbddc->adaptive_constraints_data[ii*subset_size+j+pcbddc->adaptive_constraints_data_ptr[cum]]);
3275ac47001eSStefano Zampini             PetscReal c = PetscImaginaryPart(pcbddc->adaptive_constraints_data[ii*subset_size+j+pcbddc->adaptive_constraints_data_ptr[cum]]);
3276ac47001eSStefano Zampini             ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"       %1.4e + %1.4e i\n",r,c);CHKERRQ(ierr);
3277ac47001eSStefano Zampini #else
3278ac47001eSStefano Zampini             ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"       %1.4e\n",pcbddc->adaptive_constraints_data[ii*subset_size+j+pcbddc->adaptive_constraints_data_ptr[cum]]);CHKERRQ(ierr);
3279ac47001eSStefano Zampini #endif
32809552c7c7SStefano Zampini           }
32819552c7c7SStefano Zampini         }
3282fd14bc51SStefano Zampini       }
32839162d606SStefano Zampini       ierr = PetscMemcpy(pcbddc->adaptive_constraints_idxs+pcbddc->adaptive_constraints_idxs_ptr[cum],idxs,subset_size*sizeof(PetscInt));CHKERRQ(ierr);
32849162d606SStefano Zampini       pcbddc->adaptive_constraints_idxs_ptr[cum+1] = pcbddc->adaptive_constraints_idxs_ptr[cum] + subset_size;
32859162d606SStefano Zampini       pcbddc->adaptive_constraints_data_ptr[cum+1] = pcbddc->adaptive_constraints_data_ptr[cum] + subset_size*B_neigs;
32869162d606SStefano Zampini       cum++;
328708122e43SStefano Zampini     }
328808122e43SStefano Zampini     ierr = ISRestoreIndices(sub_schurs->is_subs[i],&idxs);CHKERRQ(ierr);
328908122e43SStefano Zampini     /* shift for next computation */
329008122e43SStefano Zampini     cumarray += subset_size*subset_size;
329108122e43SStefano Zampini   }
3292fd14bc51SStefano Zampini   if (pcbddc->dbg_flag) {
3293fd14bc51SStefano Zampini     ierr = PetscViewerFlush(pcbddc->dbg_viewer);CHKERRQ(ierr);
3294fd14bc51SStefano Zampini   }
329508122e43SStefano Zampini 
329608122e43SStefano Zampini   if (mss) {
329708122e43SStefano Zampini     ierr = MatSeqAIJRestoreArray(sub_schurs->sum_S_Ej_inv_all,&Sarray);CHKERRQ(ierr);
329808122e43SStefano Zampini     ierr = MatSeqAIJRestoreArray(sub_schurs->sum_S_Ej_tilda_all,&Starray);CHKERRQ(ierr);
3299f6f667cfSStefano Zampini     /* destroy matrices (junk) */
3300f6f667cfSStefano Zampini     ierr = MatDestroy(&sub_schurs->sum_S_Ej_inv_all);CHKERRQ(ierr);
3301f6f667cfSStefano Zampini     ierr = MatDestroy(&sub_schurs->sum_S_Ej_tilda_all);CHKERRQ(ierr);
330208122e43SStefano Zampini   }
3303f6f667cfSStefano Zampini   if (allocated_S_St) {
3304f6f667cfSStefano Zampini     ierr = PetscFree2(S,St);CHKERRQ(ierr);
3305f6f667cfSStefano Zampini   }
3306f6f667cfSStefano Zampini   ierr = PetscFree5(eigv,eigs,work,B_iwork,B_ifail);CHKERRQ(ierr);
330708122e43SStefano Zampini #if defined(PETSC_USE_COMPLEX)
330808122e43SStefano Zampini   ierr = PetscFree(rwork);CHKERRQ(ierr);
330908122e43SStefano Zampini #endif
331008122e43SStefano Zampini   if (pcbddc->dbg_flag) {
33111b968477SStefano Zampini     PetscInt maxneigs_r;
3312b2566f29SBarry Smith     ierr = MPIU_Allreduce(&maxneigs,&maxneigs_r,1,MPIU_INT,MPI_MAX,PetscObjectComm((PetscObject)pc));CHKERRQ(ierr);
33139b28b941SStefano Zampini     ierr = PetscViewerASCIIPrintf(pcbddc->dbg_viewer,"Maximum number of constraints per cc %d\n",maxneigs_r);CHKERRQ(ierr);
331408122e43SStefano Zampini   }
331508122e43SStefano Zampini   PetscFunctionReturn(0);
331608122e43SStefano Zampini }
3317b1b3d7a2SStefano Zampini 
3318c8587f34SStefano Zampini PetscErrorCode PCBDDCSetUpSolvers(PC pc)
3319c8587f34SStefano Zampini {
33208629588bSStefano Zampini   PetscScalar    *coarse_submat_vals;
3321c8587f34SStefano Zampini   PetscErrorCode ierr;
3322c8587f34SStefano Zampini 
3323c8587f34SStefano Zampini   PetscFunctionBegin;
3324f4ddd8eeSStefano Zampini   /* Setup local scatters R_to_B and (optionally) R_to_D */
33255e8657edSStefano Zampini   /* PCBDDCSetUpLocalWorkVectors should be called first! */
3326c8587f34SStefano Zampini   ierr = PCBDDCSetUpLocalScatters(pc);CHKERRQ(ierr);
3327c8587f34SStefano Zampini 
3328684f6988SStefano Zampini   /* Setup local neumann solver ksp_R */
33290fccc4e9SStefano Zampini   /* PCBDDCSetUpLocalScatters should be called first! */
3330684f6988SStefano Zampini   ierr = PCBDDCSetUpLocalSolvers(pc,PETSC_FALSE,PETSC_TRUE);CHKERRQ(ierr);
3331c8587f34SStefano Zampini 
33328629588bSStefano Zampini   /*
33338629588bSStefano Zampini      Setup local correction and local part of coarse basis.
33348629588bSStefano Zampini      Gives back the dense local part of the coarse matrix in column major ordering
33358629588bSStefano Zampini   */
333647f4ddc3SStefano Zampini   ierr = PCBDDCSetUpCorrection(pc,&coarse_submat_vals);CHKERRQ(ierr);
33378629588bSStefano Zampini 
33388629588bSStefano Zampini   /* Compute total number of coarse nodes and setup coarse solver */
33398629588bSStefano Zampini   ierr = PCBDDCSetUpCoarseSolver(pc,coarse_submat_vals);CHKERRQ(ierr);
33408629588bSStefano Zampini 
33418629588bSStefano Zampini   /* free */
33428629588bSStefano Zampini   ierr = PetscFree(coarse_submat_vals);CHKERRQ(ierr);
3343c8587f34SStefano Zampini   PetscFunctionReturn(0);
3344c8587f34SStefano Zampini }
3345c8587f34SStefano Zampini 
3346674ae819SStefano Zampini PetscErrorCode PCBDDCResetCustomization(PC pc)
3347674ae819SStefano Zampini {
3348674ae819SStefano Zampini   PC_BDDC        *pcbddc = (PC_BDDC*)pc->data;
3349674ae819SStefano Zampini   PetscErrorCode ierr;
3350674ae819SStefano Zampini 
3351674ae819SStefano Zampini   PetscFunctionBegin;
3352674ae819SStefano Zampini   ierr = ISDestroy(&pcbddc->user_primal_vertices);CHKERRQ(ierr);
335330368db7SStefano Zampini   ierr = ISDestroy(&pcbddc->user_primal_vertices_local);CHKERRQ(ierr);
3354674ae819SStefano Zampini   ierr = ISDestroy(&pcbddc->NeumannBoundaries);CHKERRQ(ierr);
3355785d1243SStefano Zampini   ierr = ISDestroy(&pcbddc->NeumannBoundariesLocal);CHKERRQ(ierr);
3356674ae819SStefano Zampini   ierr = ISDestroy(&pcbddc->DirichletBoundaries);CHKERRQ(ierr);
3357f4ddd8eeSStefano Zampini   ierr = MatNullSpaceDestroy(&pcbddc->onearnullspace);CHKERRQ(ierr);
3358f4ddd8eeSStefano Zampini   ierr = PetscFree(pcbddc->onearnullvecs_state);CHKERRQ(ierr);
3359785d1243SStefano Zampini   ierr = ISDestroy(&pcbddc->DirichletBoundariesLocal);CHKERRQ(ierr);
336063602bcaSStefano Zampini   ierr = PCBDDCSetDofsSplitting(pc,0,NULL);CHKERRQ(ierr);
336163602bcaSStefano Zampini   ierr = PCBDDCSetDofsSplittingLocal(pc,0,NULL);CHKERRQ(ierr);
3362674ae819SStefano Zampini   PetscFunctionReturn(0);
3363674ae819SStefano Zampini }
3364674ae819SStefano Zampini 
3365674ae819SStefano Zampini PetscErrorCode PCBDDCResetTopography(PC pc)
3366674ae819SStefano Zampini {
3367674ae819SStefano Zampini   PC_BDDC        *pcbddc = (PC_BDDC*)pc->data;
33684f1b2e48SStefano Zampini   PetscInt       i;
3369674ae819SStefano Zampini   PetscErrorCode ierr;
3370674ae819SStefano Zampini 
3371674ae819SStefano Zampini   PetscFunctionBegin;
33721e0482f5SStefano Zampini   ierr = MatDestroy(&pcbddc->nedcG);CHKERRQ(ierr);
33731e0482f5SStefano Zampini   ierr = ISDestroy(&pcbddc->nedclocal);CHKERRQ(ierr);
3374a13144ffSStefano Zampini   ierr = MatDestroy(&pcbddc->discretegradient);CHKERRQ(ierr);
3375b9b85e73SStefano Zampini   ierr = MatDestroy(&pcbddc->user_ChangeOfBasisMatrix);CHKERRQ(ierr);
3376674ae819SStefano Zampini   ierr = MatDestroy(&pcbddc->ChangeOfBasisMatrix);CHKERRQ(ierr);
337716909a7fSStefano Zampini   ierr = MatDestroy(&pcbddc->switch_static_change);CHKERRQ(ierr);
33781dd7afcfSStefano Zampini   ierr = VecDestroy(&pcbddc->work_change);CHKERRQ(ierr);
3379674ae819SStefano Zampini   ierr = MatDestroy(&pcbddc->ConstraintMatrix);CHKERRQ(ierr);
3380669cc0f4SStefano Zampini   ierr = MatDestroy(&pcbddc->divudotp);CHKERRQ(ierr);
3381fa23a32eSStefano Zampini   ierr = ISDestroy(&pcbddc->divudotp_vl2l);CHKERRQ(ierr);
33829326c5c6Sstefano_zampini   ierr = PCBDDCGraphDestroy(&pcbddc->mat_graph);CHKERRQ(ierr);
33834f1b2e48SStefano Zampini   for (i=0;i<pcbddc->n_local_subs;i++) {
33844f1b2e48SStefano Zampini     ierr = ISDestroy(&pcbddc->local_subs[i]);CHKERRQ(ierr);
33854f1b2e48SStefano Zampini   }
3386e68a0315Sstefano_zampini   pcbddc->n_local_subs = 0;
33874f1b2e48SStefano Zampini   ierr = PetscFree(pcbddc->local_subs);CHKERRQ(ierr);
3388e68a0315Sstefano_zampini   ierr = PCBDDCSubSchursDestroy(&pcbddc->sub_schurs);CHKERRQ(ierr);
3389c703fcc7SStefano Zampini   pcbddc->graphanalyzed        = PETSC_FALSE;
33908af8fcf9SStefano Zampini   pcbddc->recompute_topography = PETSC_TRUE;
3391674ae819SStefano Zampini   PetscFunctionReturn(0);
3392674ae819SStefano Zampini }
3393674ae819SStefano Zampini 
3394674ae819SStefano Zampini PetscErrorCode PCBDDCResetSolvers(PC pc)
3395674ae819SStefano Zampini {
3396674ae819SStefano Zampini   PC_BDDC        *pcbddc = (PC_BDDC*)pc->data;
3397674ae819SStefano Zampini   PetscErrorCode ierr;
3398674ae819SStefano Zampini 
3399674ae819SStefano Zampini   PetscFunctionBegin;
3400674ae819SStefano Zampini   ierr = VecDestroy(&pcbddc->coarse_vec);CHKERRQ(ierr);
340158da7f69SStefano Zampini   if (pcbddc->coarse_phi_B) {
3402ca92afb2SStefano Zampini     PetscScalar *array;
340306656605SStefano Zampini     ierr = MatDenseGetArray(pcbddc->coarse_phi_B,&array);CHKERRQ(ierr);
340406656605SStefano Zampini     ierr = PetscFree(array);CHKERRQ(ierr);
340558da7f69SStefano Zampini   }
3406674ae819SStefano Zampini   ierr = MatDestroy(&pcbddc->coarse_phi_B);CHKERRQ(ierr);
3407674ae819SStefano Zampini   ierr = MatDestroy(&pcbddc->coarse_phi_D);CHKERRQ(ierr);
340815aaf578SStefano Zampini   ierr = MatDestroy(&pcbddc->coarse_psi_B);CHKERRQ(ierr);
340915aaf578SStefano Zampini   ierr = MatDestroy(&pcbddc->coarse_psi_D);CHKERRQ(ierr);
3410674ae819SStefano Zampini   ierr = VecDestroy(&pcbddc->vec1_P);CHKERRQ(ierr);
3411674ae819SStefano Zampini   ierr = VecDestroy(&pcbddc->vec1_C);CHKERRQ(ierr);
3412674ae819SStefano Zampini   ierr = MatDestroy(&pcbddc->local_auxmat2);CHKERRQ(ierr);
341306656605SStefano Zampini   ierr = MatDestroy(&pcbddc->local_auxmat1);CHKERRQ(ierr);
3414674ae819SStefano Zampini   ierr = VecDestroy(&pcbddc->vec1_R);CHKERRQ(ierr);
3415674ae819SStefano Zampini   ierr = VecDestroy(&pcbddc->vec2_R);CHKERRQ(ierr);
34168ce42a96SStefano Zampini   ierr = ISDestroy(&pcbddc->is_R_local);CHKERRQ(ierr);
3417674ae819SStefano Zampini   ierr = VecScatterDestroy(&pcbddc->R_to_B);CHKERRQ(ierr);
3418674ae819SStefano Zampini   ierr = VecScatterDestroy(&pcbddc->R_to_D);CHKERRQ(ierr);
3419674ae819SStefano Zampini   ierr = VecScatterDestroy(&pcbddc->coarse_loc_to_glob);CHKERRQ(ierr);
34209326c5c6Sstefano_zampini   ierr = KSPReset(pcbddc->ksp_D);CHKERRQ(ierr);
34219326c5c6Sstefano_zampini   ierr = KSPReset(pcbddc->ksp_R);CHKERRQ(ierr);
34229326c5c6Sstefano_zampini   ierr = KSPReset(pcbddc->coarse_ksp);CHKERRQ(ierr);
3423f4ddd8eeSStefano Zampini   ierr = MatDestroy(&pcbddc->local_mat);CHKERRQ(ierr);
3424727cdba6SStefano Zampini   ierr = PetscFree(pcbddc->primal_indices_local_idxs);CHKERRQ(ierr);
34250e6343abSStefano Zampini   ierr = PetscFree2(pcbddc->local_primal_ref_node,pcbddc->local_primal_ref_mult);CHKERRQ(ierr);
3426f4ddd8eeSStefano Zampini   ierr = PetscFree(pcbddc->global_primal_indices);CHKERRQ(ierr);
342770cf5478SStefano Zampini   ierr = ISDestroy(&pcbddc->coarse_subassembling);CHKERRQ(ierr);
342881d14e9dSStefano Zampini   ierr = MatDestroy(&pcbddc->benign_change);CHKERRQ(ierr);
34290369aaf7SStefano Zampini   ierr = VecDestroy(&pcbddc->benign_vec);CHKERRQ(ierr);
34301dd7afcfSStefano Zampini   ierr = PCBDDCBenignShellMat(pc,PETSC_TRUE);CHKERRQ(ierr);
34314f1b2e48SStefano Zampini   ierr = MatDestroy(&pcbddc->benign_B0);CHKERRQ(ierr);
34328b9f24d4SStefano Zampini   ierr = PetscSFDestroy(&pcbddc->benign_sf);CHKERRQ(ierr);
3433ca92afb2SStefano Zampini   if (pcbddc->benign_zerodiag_subs) {
3434ca92afb2SStefano Zampini     PetscInt i;
3435ca92afb2SStefano Zampini     for (i=0;i<pcbddc->benign_n;i++) {
3436ca92afb2SStefano Zampini       ierr = ISDestroy(&pcbddc->benign_zerodiag_subs[i]);CHKERRQ(ierr);
3437ca92afb2SStefano Zampini     }
3438ca92afb2SStefano Zampini     ierr = PetscFree(pcbddc->benign_zerodiag_subs);CHKERRQ(ierr);
3439ca92afb2SStefano Zampini   }
34404f1b2e48SStefano Zampini   ierr = PetscFree3(pcbddc->benign_p0_lidx,pcbddc->benign_p0_gidx,pcbddc->benign_p0);CHKERRQ(ierr);
3441674ae819SStefano Zampini   PetscFunctionReturn(0);
3442674ae819SStefano Zampini }
3443674ae819SStefano Zampini 
3444f4ddd8eeSStefano Zampini PetscErrorCode PCBDDCSetUpLocalWorkVectors(PC pc)
34456bfb1811SStefano Zampini {
34466bfb1811SStefano Zampini   PC_BDDC        *pcbddc = (PC_BDDC*)pc->data;
34476bfb1811SStefano Zampini   PC_IS          *pcis = (PC_IS*)pc->data;
34486bfb1811SStefano Zampini   VecType        impVecType;
34494f1b2e48SStefano Zampini   PetscInt       n_constraints,n_R,old_size;
34506bfb1811SStefano Zampini   PetscErrorCode ierr;
34516bfb1811SStefano Zampini 
34526bfb1811SStefano Zampini   PetscFunctionBegin;
34534f1b2e48SStefano Zampini   n_constraints = pcbddc->local_primal_size - pcbddc->benign_n - pcbddc->n_vertices;
3454b371cd4fSStefano Zampini   n_R = pcis->n - pcbddc->n_vertices;
34556bfb1811SStefano Zampini   ierr = VecGetType(pcis->vec1_N,&impVecType);CHKERRQ(ierr);
3456e7b262bdSStefano Zampini   /* local work vectors (try to avoid unneeded work)*/
3457e7b262bdSStefano Zampini   /* R nodes */
3458e7b262bdSStefano Zampini   old_size = -1;
3459e7b262bdSStefano Zampini   if (pcbddc->vec1_R) {
3460e7b262bdSStefano Zampini     ierr = VecGetSize(pcbddc->vec1_R,&old_size);CHKERRQ(ierr);
3461e7b262bdSStefano Zampini   }
3462e7b262bdSStefano Zampini   if (n_R != old_size) {
3463e7b262bdSStefano Zampini     ierr = VecDestroy(&pcbddc->vec1_R);CHKERRQ(ierr);
3464e7b262bdSStefano Zampini     ierr = VecDestroy(&pcbddc->vec2_R);CHKERRQ(ierr);
34656bfb1811SStefano Zampini     ierr = VecCreate(PetscObjectComm((PetscObject)pcis->vec1_N),&pcbddc->vec1_R);CHKERRQ(ierr);
34666bfb1811SStefano Zampini     ierr = VecSetSizes(pcbddc->vec1_R,PETSC_DECIDE,n_R);CHKERRQ(ierr);
34676bfb1811SStefano Zampini     ierr = VecSetType(pcbddc->vec1_R,impVecType);CHKERRQ(ierr);
34686bfb1811SStefano Zampini     ierr = VecDuplicate(pcbddc->vec1_R,&pcbddc->vec2_R);CHKERRQ(ierr);
3469e7b262bdSStefano Zampini   }
3470e7b262bdSStefano Zampini   /* local primal dofs */
3471e7b262bdSStefano Zampini   old_size = -1;
3472e7b262bdSStefano Zampini   if (pcbddc->vec1_P) {
3473e7b262bdSStefano Zampini     ierr = VecGetSize(pcbddc->vec1_P,&old_size);CHKERRQ(ierr);
3474e7b262bdSStefano Zampini   }
3475e9189074SStefano Zampini   if (pcbddc->local_primal_size != old_size) {
3476e7b262bdSStefano Zampini     ierr = VecDestroy(&pcbddc->vec1_P);CHKERRQ(ierr);
347783b7ccabSStefano Zampini     ierr = VecCreate(PetscObjectComm((PetscObject)pcis->vec1_N),&pcbddc->vec1_P);CHKERRQ(ierr);
3478e9189074SStefano Zampini     ierr = VecSetSizes(pcbddc->vec1_P,PETSC_DECIDE,pcbddc->local_primal_size);CHKERRQ(ierr);
34796bfb1811SStefano Zampini     ierr = VecSetType(pcbddc->vec1_P,impVecType);CHKERRQ(ierr);
3480e7b262bdSStefano Zampini   }
3481e7b262bdSStefano Zampini   /* local explicit constraints */
3482e7b262bdSStefano Zampini   old_size = -1;
3483e7b262bdSStefano Zampini   if (pcbddc->vec1_C) {
3484e7b262bdSStefano Zampini     ierr = VecGetSize(pcbddc->vec1_C,&old_size);CHKERRQ(ierr);
3485e7b262bdSStefano Zampini   }
3486e7b262bdSStefano Zampini   if (n_constraints && n_constraints != old_size) {
3487e7b262bdSStefano Zampini     ierr = VecDestroy(&pcbddc->vec1_C);CHKERRQ(ierr);
348883b7ccabSStefano Zampini     ierr = VecCreate(PetscObjectComm((PetscObject)pcis->vec1_N),&pcbddc->vec1_C);CHKERRQ(ierr);
348983b7ccabSStefano Zampini     ierr = VecSetSizes(pcbddc->vec1_C,PETSC_DECIDE,n_constraints);CHKERRQ(ierr);
349083b7ccabSStefano Zampini     ierr = VecSetType(pcbddc->vec1_C,impVecType);CHKERRQ(ierr);
349183b7ccabSStefano Zampini   }
34926bfb1811SStefano Zampini   PetscFunctionReturn(0);
34936bfb1811SStefano Zampini }
34946bfb1811SStefano Zampini 
349547f4ddc3SStefano Zampini PetscErrorCode PCBDDCSetUpCorrection(PC pc, PetscScalar **coarse_submat_vals_n)
349688ebb749SStefano Zampini {
349725084f0cSStefano Zampini   PetscErrorCode  ierr;
349825084f0cSStefano Zampini   /* pointers to pcis and pcbddc */
349988ebb749SStefano Zampini   PC_IS*          pcis = (PC_IS*)pc->data;
350088ebb749SStefano Zampini   PC_BDDC*        pcbddc = (PC_BDDC*)pc->data;
3501d62866d3SStefano Zampini   PCBDDCSubSchurs sub_schurs = pcbddc->sub_schurs;
350225084f0cSStefano Zampini   /* submatrices of local problem */
350380677318SStefano Zampini   Mat             A_RV,A_VR,A_VV,local_auxmat2_R;
350406656605SStefano Zampini   /* submatrices of local coarse problem */
350506656605SStefano Zampini   Mat             S_VV,S_CV,S_VC,S_CC;
350625084f0cSStefano Zampini   /* working matrices */
350706656605SStefano Zampini   Mat             C_CR;
350825084f0cSStefano Zampini   /* additional working stuff */
350906656605SStefano Zampini   PC              pc_R;
3510c58f9fdbSStefano Zampini   Mat             F,Brhs = NULL;
35115cbda25cSStefano Zampini   Vec             dummy_vec;
3512c58f9fdbSStefano Zampini   PetscBool       isLU,isCHOL,isILU,need_benign_correction,sparserhs;
351325084f0cSStefano Zampini   PetscScalar     *coarse_submat_vals; /* TODO: use a PETSc matrix */
351406656605SStefano Zampini   PetscScalar     *work;
351506656605SStefano Zampini   PetscInt        *idx_V_B;
3516ffd830a3SStefano Zampini   PetscInt        lda_rhs,n,n_vertices,n_constraints,*p0_lidx_I;
351706656605SStefano Zampini   PetscInt        i,n_R,n_D,n_B;
3518ffd830a3SStefano Zampini 
351925084f0cSStefano Zampini   /* some shortcuts to scalars */
352006656605SStefano Zampini   PetscScalar     one=1.0,m_one=-1.0;
352188ebb749SStefano Zampini 
352288ebb749SStefano Zampini   PetscFunctionBegin;
35239a962809SStefano Zampini   if (!pcbddc->symmetric_primal && pcbddc->benign_n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"Non-symmetric primal basis computation with benign trick not yet implemented");
3524ffd830a3SStefano Zampini 
3525ffd830a3SStefano Zampini   /* Set Non-overlapping dimensions */
3526b371cd4fSStefano Zampini   n_vertices = pcbddc->n_vertices;
35274f1b2e48SStefano Zampini   n_constraints = pcbddc->local_primal_size - pcbddc->benign_n - n_vertices;
3528b371cd4fSStefano Zampini   n_B = pcis->n_B;
3529b371cd4fSStefano Zampini   n_D = pcis->n - n_B;
353088ebb749SStefano Zampini   n_R = pcis->n - n_vertices;
353188ebb749SStefano Zampini 
353288ebb749SStefano Zampini   /* vertices in boundary numbering */
3533785e854fSJed Brown   ierr = PetscMalloc1(n_vertices,&idx_V_B);CHKERRQ(ierr);
35340e6343abSStefano Zampini   ierr = ISGlobalToLocalMappingApply(pcis->BtoNmap,IS_GTOLM_DROP,n_vertices,pcbddc->local_primal_ref_node,&i,idx_V_B);CHKERRQ(ierr);
35356c4ed002SBarry Smith   if (i != n_vertices) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Error in boundary numbering for BDDC vertices! %D != %D\n",n_vertices,i);
353688ebb749SStefano Zampini 
353706656605SStefano Zampini   /* Subdomain contribution (Non-overlapping) to coarse matrix  */
3538019a44ceSStefano Zampini   ierr = PetscCalloc1(pcbddc->local_primal_size*pcbddc->local_primal_size,&coarse_submat_vals);CHKERRQ(ierr);
353906656605SStefano Zampini   ierr = MatCreateSeqDense(PETSC_COMM_SELF,n_vertices,n_vertices,coarse_submat_vals,&S_VV);CHKERRQ(ierr);
354006656605SStefano Zampini   ierr = MatSeqDenseSetLDA(S_VV,pcbddc->local_primal_size);CHKERRQ(ierr);
354106656605SStefano Zampini   ierr = MatCreateSeqDense(PETSC_COMM_SELF,n_constraints,n_vertices,coarse_submat_vals+n_vertices,&S_CV);CHKERRQ(ierr);
354206656605SStefano Zampini   ierr = MatSeqDenseSetLDA(S_CV,pcbddc->local_primal_size);CHKERRQ(ierr);
354306656605SStefano Zampini   ierr = MatCreateSeqDense(PETSC_COMM_SELF,n_vertices,n_constraints,coarse_submat_vals+pcbddc->local_primal_size*n_vertices,&S_VC);CHKERRQ(ierr);
354406656605SStefano Zampini   ierr = MatSeqDenseSetLDA(S_VC,pcbddc->local_primal_size);CHKERRQ(ierr);
354506656605SStefano Zampini   ierr = MatCreateSeqDense(PETSC_COMM_SELF,n_constraints,n_constraints,coarse_submat_vals+(pcbddc->local_primal_size+1)*n_vertices,&S_CC);CHKERRQ(ierr);
354606656605SStefano Zampini   ierr = MatSeqDenseSetLDA(S_CC,pcbddc->local_primal_size);CHKERRQ(ierr);
354706656605SStefano Zampini 
354806656605SStefano Zampini   /* determine if can use MatSolve routines instead of calling KSPSolve on ksp_R */
354906656605SStefano Zampini   ierr = KSPGetPC(pcbddc->ksp_R,&pc_R);CHKERRQ(ierr);
355006656605SStefano Zampini   ierr = PetscObjectTypeCompare((PetscObject)pc_R,PCLU,&isLU);CHKERRQ(ierr);
355106656605SStefano Zampini   ierr = PetscObjectTypeCompare((PetscObject)pc_R,PCILU,&isILU);CHKERRQ(ierr);
355206656605SStefano Zampini   ierr = PetscObjectTypeCompare((PetscObject)pc_R,PCCHOLESKY,&isCHOL);CHKERRQ(ierr);
3553ffd830a3SStefano Zampini   lda_rhs = n_R;
3554a3df083aSStefano Zampini   need_benign_correction = PETSC_FALSE;
355506656605SStefano Zampini   if (isLU || isILU || isCHOL) {
355606656605SStefano Zampini     ierr = PCFactorGetMatrix(pc_R,&F);CHKERRQ(ierr);
3557b334f244SStefano Zampini   } else if (sub_schurs && sub_schurs->reuse_solver) {
3558df4d28bfSStefano Zampini     PCBDDCReuseSolvers reuse_solver = sub_schurs->reuse_solver;
3559d62866d3SStefano Zampini     MatFactorType      type;
3560d62866d3SStefano Zampini 
3561df4d28bfSStefano Zampini     F = reuse_solver->F;
35626816873aSStefano Zampini     ierr = MatGetFactorType(F,&type);CHKERRQ(ierr);
3563d62866d3SStefano Zampini     if (type == MAT_FACTOR_CHOLESKY) isCHOL = PETSC_TRUE;
3564ffd830a3SStefano Zampini     ierr = MatGetSize(F,&lda_rhs,NULL);CHKERRQ(ierr);
356522db5ddcSStefano Zampini     need_benign_correction = (PetscBool)(!!reuse_solver->benign_n);
356606656605SStefano Zampini   } else {
356706656605SStefano Zampini     F = NULL;
356806656605SStefano Zampini   }
356906656605SStefano Zampini 
3570c58f9fdbSStefano Zampini   /* determine if we can use a sparse right-hand side */
3571c58f9fdbSStefano Zampini   sparserhs = PETSC_FALSE;
3572c58f9fdbSStefano Zampini   if (F) {
3573c58f9fdbSStefano Zampini     const MatSolverPackage solver;
3574c58f9fdbSStefano Zampini 
3575c58f9fdbSStefano Zampini     ierr = MatFactorGetSolverPackage(F,&solver);CHKERRQ(ierr);
3576c58f9fdbSStefano Zampini     ierr = PetscStrcmp(solver,MATSOLVERMUMPS,&sparserhs);CHKERRQ(ierr);
3577c58f9fdbSStefano Zampini   }
3578c58f9fdbSStefano Zampini 
3579ffd830a3SStefano Zampini   /* allocate workspace */
3580ffd830a3SStefano Zampini   n = 0;
3581ffd830a3SStefano Zampini   if (n_constraints) {
3582ffd830a3SStefano Zampini     n += lda_rhs*n_constraints;
3583ffd830a3SStefano Zampini   }
3584ffd830a3SStefano Zampini   if (n_vertices) {
3585ffd830a3SStefano Zampini     n = PetscMax(2*lda_rhs*n_vertices,n);
3586ffd830a3SStefano Zampini     n = PetscMax((lda_rhs+n_B)*n_vertices,n);
3587ffd830a3SStefano Zampini   }
35882a3a6641Sstefano_zampini   if (!pcbddc->symmetric_primal) {
35892a3a6641Sstefano_zampini     n = PetscMax(2*lda_rhs*pcbddc->local_primal_size,n);
35902a3a6641Sstefano_zampini   }
3591ffd830a3SStefano Zampini   ierr = PetscMalloc1(n,&work);CHKERRQ(ierr);
3592ffd830a3SStefano Zampini 
35935cbda25cSStefano Zampini   /* create dummy vector to modify rhs and sol of MatMatSolve (work array will never be used) */
35945cbda25cSStefano Zampini   dummy_vec = NULL;
35955cbda25cSStefano Zampini   if (need_benign_correction && lda_rhs != n_R && F) {
35965cbda25cSStefano Zampini     ierr = VecCreateSeqWithArray(PETSC_COMM_SELF,1,lda_rhs,work,&dummy_vec);CHKERRQ(ierr);
35975cbda25cSStefano Zampini   }
35985cbda25cSStefano Zampini 
359988ebb749SStefano Zampini   /* Precompute stuffs needed for preprocessing and application of BDDC*/
360088ebb749SStefano Zampini   if (n_constraints) {
360172b8c272SStefano Zampini     Mat         M1,M2,M3,C_B;
360206656605SStefano Zampini     IS          is_aux;
360380677318SStefano Zampini     PetscScalar *array,*array2;
360406656605SStefano Zampini 
3605f4ddd8eeSStefano Zampini     ierr = MatDestroy(&pcbddc->local_auxmat1);CHKERRQ(ierr);
360680677318SStefano Zampini     ierr = MatDestroy(&pcbddc->local_auxmat2);CHKERRQ(ierr);
360788ebb749SStefano Zampini 
360825084f0cSStefano Zampini     /* Extract constraints on R nodes: C_{CR}  */
360925084f0cSStefano Zampini     ierr = ISCreateStride(PETSC_COMM_SELF,n_constraints,n_vertices,1,&is_aux);CHKERRQ(ierr);
36107dae84e0SHong Zhang     ierr = MatCreateSubMatrix(pcbddc->ConstraintMatrix,is_aux,pcbddc->is_R_local,MAT_INITIAL_MATRIX,&C_CR);CHKERRQ(ierr);
36117dae84e0SHong Zhang     ierr = MatCreateSubMatrix(pcbddc->ConstraintMatrix,is_aux,pcis->is_B_local,MAT_INITIAL_MATRIX,&C_B);CHKERRQ(ierr);
361288ebb749SStefano Zampini 
361380677318SStefano Zampini     /* Assemble         local_auxmat2_R =        (- A_{RR}^{-1} C^T_{CR}) needed by BDDC setup */
361480677318SStefano Zampini     /* Assemble pcbddc->local_auxmat2   = R_to_B (- A_{RR}^{-1} C^T_{CR}) needed by BDDC application */
3615c58f9fdbSStefano Zampini     if (!sparserhs) {
3616ffd830a3SStefano Zampini       ierr = PetscMemzero(work,lda_rhs*n_constraints*sizeof(PetscScalar));CHKERRQ(ierr);
361788ebb749SStefano Zampini       for (i=0;i<n_constraints;i++) {
361806656605SStefano Zampini         const PetscScalar *row_cmat_values;
361906656605SStefano Zampini         const PetscInt    *row_cmat_indices;
362006656605SStefano Zampini         PetscInt          size_of_constraint,j;
362188ebb749SStefano Zampini 
362206656605SStefano Zampini         ierr = MatGetRow(C_CR,i,&size_of_constraint,&row_cmat_indices,&row_cmat_values);CHKERRQ(ierr);
362306656605SStefano Zampini         for (j=0;j<size_of_constraint;j++) {
3624ffd830a3SStefano Zampini           work[row_cmat_indices[j]+i*lda_rhs] = -row_cmat_values[j];
362506656605SStefano Zampini         }
362606656605SStefano Zampini         ierr = MatRestoreRow(C_CR,i,&size_of_constraint,&row_cmat_indices,&row_cmat_values);CHKERRQ(ierr);
362706656605SStefano Zampini       }
3628c58f9fdbSStefano Zampini       ierr = MatCreateSeqDense(PETSC_COMM_SELF,lda_rhs,n_constraints,work,&Brhs);CHKERRQ(ierr);
3629c58f9fdbSStefano Zampini     } else {
3630c58f9fdbSStefano Zampini       Mat tC_CR;
3631c58f9fdbSStefano Zampini 
3632c58f9fdbSStefano Zampini       ierr = MatScale(C_CR,-1.0);CHKERRQ(ierr);
3633c58f9fdbSStefano Zampini       if (lda_rhs != n_R) {
3634c58f9fdbSStefano Zampini         PetscScalar *aa;
3635c58f9fdbSStefano Zampini         PetscInt    r,*ii,*jj;
3636c58f9fdbSStefano Zampini         PetscBool   done;
3637c58f9fdbSStefano Zampini 
3638c58f9fdbSStefano Zampini         ierr = MatGetRowIJ(C_CR,0,PETSC_FALSE,PETSC_FALSE,&r,(const PetscInt**)&ii,(const PetscInt**)&jj,&done);CHKERRQ(ierr);
363913903a91SSatish Balay         if (!done) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"GetRowIJ failed");
3640c58f9fdbSStefano Zampini         ierr = MatSeqAIJGetArray(C_CR,&aa);CHKERRQ(ierr);
3641c58f9fdbSStefano Zampini         ierr = MatCreateSeqAIJWithArrays(PETSC_COMM_SELF,n_constraints,lda_rhs,ii,jj,aa,&tC_CR);CHKERRQ(ierr);
3642c58f9fdbSStefano Zampini         ierr = MatRestoreRowIJ(C_CR,0,PETSC_FALSE,PETSC_FALSE,&r,(const PetscInt**)&ii,(const PetscInt**)&jj,&done);CHKERRQ(ierr);
364313903a91SSatish Balay         if (!done) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"RestoreRowIJ failed");
3644c58f9fdbSStefano Zampini       } else {
3645c58f9fdbSStefano Zampini         ierr  = PetscObjectReference((PetscObject)C_CR);CHKERRQ(ierr);
3646c58f9fdbSStefano Zampini         tC_CR = C_CR;
3647c58f9fdbSStefano Zampini       }
3648c58f9fdbSStefano Zampini       ierr = MatCreateTranspose(tC_CR,&Brhs);CHKERRQ(ierr);
3649c58f9fdbSStefano Zampini       ierr = MatDestroy(&tC_CR);CHKERRQ(ierr);
3650c58f9fdbSStefano Zampini     }
3651ffd830a3SStefano Zampini     ierr = MatCreateSeqDense(PETSC_COMM_SELF,lda_rhs,n_constraints,NULL,&local_auxmat2_R);CHKERRQ(ierr);
365206656605SStefano Zampini     if (F) {
3653a3df083aSStefano Zampini       if (need_benign_correction) {
3654df4d28bfSStefano Zampini         PCBDDCReuseSolvers reuse_solver = sub_schurs->reuse_solver;
3655a3df083aSStefano Zampini 
365672b8c272SStefano Zampini         /* rhs is already zero on interior dofs, no need to change the rhs */
365772b8c272SStefano Zampini         ierr = PetscMemzero(reuse_solver->benign_save_vals,pcbddc->benign_n*sizeof(PetscScalar));CHKERRQ(ierr);
3658a3df083aSStefano Zampini       }
3659c58f9fdbSStefano Zampini       ierr = MatMatSolve(F,Brhs,local_auxmat2_R);CHKERRQ(ierr);
3660a3df083aSStefano Zampini       if (need_benign_correction) {
3661a3df083aSStefano Zampini         PetscScalar        *marr;
3662df4d28bfSStefano Zampini         PCBDDCReuseSolvers reuse_solver = sub_schurs->reuse_solver;
3663a3df083aSStefano Zampini 
3664a3df083aSStefano Zampini         ierr = MatDenseGetArray(local_auxmat2_R,&marr);CHKERRQ(ierr);
36655cbda25cSStefano Zampini         if (lda_rhs != n_R) {
36665cbda25cSStefano Zampini           for (i=0;i<n_constraints;i++) {
36675cbda25cSStefano Zampini             ierr = VecPlaceArray(dummy_vec,marr+i*lda_rhs);CHKERRQ(ierr);
36685cbda25cSStefano Zampini             ierr = PCBDDCReuseSolversBenignAdapt(reuse_solver,dummy_vec,NULL,PETSC_TRUE,PETSC_TRUE);CHKERRQ(ierr);
36695cbda25cSStefano Zampini             ierr = VecResetArray(dummy_vec);CHKERRQ(ierr);
36705cbda25cSStefano Zampini           }
36715cbda25cSStefano Zampini         } else {
3672a3df083aSStefano Zampini           for (i=0;i<n_constraints;i++) {
3673a3df083aSStefano Zampini             ierr = VecPlaceArray(pcbddc->vec1_R,marr+i*lda_rhs);CHKERRQ(ierr);
36745cbda25cSStefano Zampini             ierr = PCBDDCReuseSolversBenignAdapt(reuse_solver,pcbddc->vec1_R,NULL,PETSC_TRUE,PETSC_TRUE);CHKERRQ(ierr);
3675a3df083aSStefano Zampini             ierr = VecResetArray(pcbddc->vec1_R);CHKERRQ(ierr);
3676a3df083aSStefano Zampini           }
36775cbda25cSStefano Zampini         }
3678a3df083aSStefano Zampini         ierr = MatDenseRestoreArray(local_auxmat2_R,&marr);CHKERRQ(ierr);
3679a3df083aSStefano Zampini       }
368006656605SStefano Zampini     } else {
368180677318SStefano Zampini       PetscScalar *marr;
368280677318SStefano Zampini 
368380677318SStefano Zampini       ierr = MatDenseGetArray(local_auxmat2_R,&marr);CHKERRQ(ierr);
368406656605SStefano Zampini       for (i=0;i<n_constraints;i++) {
3685ffd830a3SStefano Zampini         ierr = VecPlaceArray(pcbddc->vec1_R,work+i*lda_rhs);CHKERRQ(ierr);
3686ffd830a3SStefano Zampini         ierr = VecPlaceArray(pcbddc->vec2_R,marr+i*lda_rhs);CHKERRQ(ierr);
368706656605SStefano Zampini         ierr = KSPSolve(pcbddc->ksp_R,pcbddc->vec1_R,pcbddc->vec2_R);CHKERRQ(ierr);
368806656605SStefano Zampini         ierr = VecResetArray(pcbddc->vec1_R);CHKERRQ(ierr);
368906656605SStefano Zampini         ierr = VecResetArray(pcbddc->vec2_R);CHKERRQ(ierr);
369006656605SStefano Zampini       }
369180677318SStefano Zampini       ierr = MatDenseRestoreArray(local_auxmat2_R,&marr);CHKERRQ(ierr);
369206656605SStefano Zampini     }
3693c58f9fdbSStefano Zampini     if (sparserhs) {
3694c58f9fdbSStefano Zampini       ierr = MatScale(C_CR,-1.0);CHKERRQ(ierr);
3695c58f9fdbSStefano Zampini     }
3696c58f9fdbSStefano Zampini     ierr = MatDestroy(&Brhs);CHKERRQ(ierr);
369780677318SStefano Zampini     if (!pcbddc->switch_static) {
369880677318SStefano Zampini       ierr = MatCreateSeqDense(PETSC_COMM_SELF,n_B,n_constraints,NULL,&pcbddc->local_auxmat2);CHKERRQ(ierr);
369980677318SStefano Zampini       ierr = MatDenseGetArray(pcbddc->local_auxmat2,&array);CHKERRQ(ierr);
370080677318SStefano Zampini       ierr = MatDenseGetArray(local_auxmat2_R,&array2);CHKERRQ(ierr);
370180677318SStefano Zampini       for (i=0;i<n_constraints;i++) {
3702ffd830a3SStefano Zampini         ierr = VecPlaceArray(pcbddc->vec1_R,array2+i*lda_rhs);CHKERRQ(ierr);
370380677318SStefano Zampini         ierr = VecPlaceArray(pcis->vec1_B,array+i*n_B);CHKERRQ(ierr);
370480677318SStefano Zampini         ierr = VecScatterBegin(pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
370580677318SStefano Zampini         ierr = VecScatterEnd(pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
370680677318SStefano Zampini         ierr = VecResetArray(pcis->vec1_B);CHKERRQ(ierr);
370780677318SStefano Zampini         ierr = VecResetArray(pcbddc->vec1_R);CHKERRQ(ierr);
370880677318SStefano Zampini       }
370980677318SStefano Zampini       ierr = MatDenseRestoreArray(local_auxmat2_R,&array2);CHKERRQ(ierr);
371080677318SStefano Zampini       ierr = MatDenseRestoreArray(pcbddc->local_auxmat2,&array);CHKERRQ(ierr);
371172b8c272SStefano Zampini       ierr = MatMatMult(C_B,pcbddc->local_auxmat2,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&M3);CHKERRQ(ierr);
371280677318SStefano Zampini     } else {
3713ffd830a3SStefano Zampini       if (lda_rhs != n_R) {
3714ffd830a3SStefano Zampini         IS dummy;
3715ffd830a3SStefano Zampini 
3716ffd830a3SStefano Zampini         ierr = ISCreateStride(PETSC_COMM_SELF,n_R,0,1,&dummy);CHKERRQ(ierr);
37177dae84e0SHong Zhang         ierr = MatCreateSubMatrix(local_auxmat2_R,dummy,NULL,MAT_INITIAL_MATRIX,&pcbddc->local_auxmat2);CHKERRQ(ierr);
3718ffd830a3SStefano Zampini         ierr = ISDestroy(&dummy);CHKERRQ(ierr);
3719ffd830a3SStefano Zampini       } else {
372080677318SStefano Zampini         ierr = PetscObjectReference((PetscObject)local_auxmat2_R);CHKERRQ(ierr);
372180677318SStefano Zampini         pcbddc->local_auxmat2 = local_auxmat2_R;
3722ffd830a3SStefano Zampini       }
372325084f0cSStefano Zampini       ierr = MatMatMult(C_CR,pcbddc->local_auxmat2,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&M3);CHKERRQ(ierr);
372480677318SStefano Zampini     }
372580677318SStefano Zampini     ierr = ISDestroy(&is_aux);CHKERRQ(ierr);
372680677318SStefano Zampini     /* Assemble explicitly S_CC = ( C_{CR} A_{RR}^{-1} C^T_{CR} )^{-1}  */
372780677318SStefano Zampini     ierr = MatScale(M3,m_one);CHKERRQ(ierr);
372806656605SStefano Zampini     ierr = MatDuplicate(M3,MAT_DO_NOT_COPY_VALUES,&M1);CHKERRQ(ierr);
372906656605SStefano Zampini     ierr = MatDuplicate(M3,MAT_DO_NOT_COPY_VALUES,&M2);CHKERRQ(ierr);
373080677318SStefano Zampini     if (isCHOL) {
373180677318SStefano Zampini       ierr = MatCholeskyFactor(M3,NULL,NULL);CHKERRQ(ierr);
373280677318SStefano Zampini     } else {
373325084f0cSStefano Zampini       ierr = MatLUFactor(M3,NULL,NULL,NULL);CHKERRQ(ierr);
373480677318SStefano Zampini     }
373580677318SStefano Zampini     ierr = VecSet(pcbddc->vec1_C,one);CHKERRQ(ierr);
373606656605SStefano Zampini     ierr = MatDiagonalSet(M2,pcbddc->vec1_C,INSERT_VALUES);CHKERRQ(ierr);
373725084f0cSStefano Zampini     ierr = MatMatSolve(M3,M2,M1);CHKERRQ(ierr);
373825084f0cSStefano Zampini     ierr = MatDestroy(&M2);CHKERRQ(ierr);
373925084f0cSStefano Zampini     ierr = MatDestroy(&M3);CHKERRQ(ierr);
374080677318SStefano Zampini     /* Assemble local_auxmat1 = S_CC*C_{CB} needed by BDDC application in KSP and in preproc */
374172b8c272SStefano Zampini     ierr = MatMatMult(M1,C_B,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&pcbddc->local_auxmat1);CHKERRQ(ierr);
374272b8c272SStefano Zampini     ierr = MatDestroy(&C_B);CHKERRQ(ierr);
374306656605SStefano Zampini     ierr = MatCopy(M1,S_CC,SAME_NONZERO_PATTERN);CHKERRQ(ierr); /* S_CC can have a different LDA, MatMatSolve doesn't support it */
374406656605SStefano Zampini     ierr = MatDestroy(&M1);CHKERRQ(ierr);
3745f4ddd8eeSStefano Zampini   }
3746fc227af8SStefano Zampini 
3747fc227af8SStefano Zampini   /* Get submatrices from subdomain matrix */
374888ebb749SStefano Zampini   if (n_vertices) {
374906656605SStefano Zampini     IS        is_aux;
3750c58f9fdbSStefano Zampini     PetscBool isseqaij;
37513a50541eSStefano Zampini 
3752b334f244SStefano Zampini     if (sub_schurs && sub_schurs->reuse_solver) { /* is_R_local is not sorted, ISComplement doesn't like it */
37536816873aSStefano Zampini       IS tis;
37546816873aSStefano Zampini 
37556816873aSStefano Zampini       ierr = ISDuplicate(pcbddc->is_R_local,&tis);CHKERRQ(ierr);
37566816873aSStefano Zampini       ierr = ISSort(tis);CHKERRQ(ierr);
37576816873aSStefano Zampini       ierr = ISComplement(tis,0,pcis->n,&is_aux);CHKERRQ(ierr);
37586816873aSStefano Zampini       ierr = ISDestroy(&tis);CHKERRQ(ierr);
37596816873aSStefano Zampini     } else {
37603a50541eSStefano Zampini       ierr = ISComplement(pcbddc->is_R_local,0,pcis->n,&is_aux);CHKERRQ(ierr);
37616816873aSStefano Zampini     }
37627dae84e0SHong Zhang     ierr = MatCreateSubMatrix(pcbddc->local_mat,pcbddc->is_R_local,is_aux,MAT_INITIAL_MATRIX,&A_RV);CHKERRQ(ierr);
37637dae84e0SHong Zhang     ierr = MatCreateSubMatrix(pcbddc->local_mat,is_aux,pcbddc->is_R_local,MAT_INITIAL_MATRIX,&A_VR);CHKERRQ(ierr);
3764c58f9fdbSStefano Zampini     ierr = PetscObjectTypeCompare((PetscObject)A_VR,MATSEQAIJ,&isseqaij);CHKERRQ(ierr);
3765c58f9fdbSStefano Zampini     if (!isseqaij) { /* MatMatMult(A_VR,A_RRmA_RV) below will raise an error */
3766c58f9fdbSStefano Zampini       ierr = MatConvert(A_VR,MATSEQAIJ,MAT_INPLACE_MATRIX,&A_VR);CHKERRQ(ierr);
3767c58f9fdbSStefano Zampini     }
37687dae84e0SHong Zhang     ierr = MatCreateSubMatrix(pcbddc->local_mat,is_aux,is_aux,MAT_INITIAL_MATRIX,&A_VV);CHKERRQ(ierr);
376925084f0cSStefano Zampini     ierr = ISDestroy(&is_aux);CHKERRQ(ierr);
377088ebb749SStefano Zampini   }
377188ebb749SStefano Zampini 
377288ebb749SStefano Zampini   /* Matrix of coarse basis functions (local) */
3773f4ddd8eeSStefano Zampini   if (pcbddc->coarse_phi_B) {
377406656605SStefano Zampini     PetscInt on_B,on_primal,on_D=n_D;
377506656605SStefano Zampini     if (pcbddc->coarse_phi_D) {
377606656605SStefano Zampini       ierr = MatGetSize(pcbddc->coarse_phi_D,&on_D,NULL);CHKERRQ(ierr);
377706656605SStefano Zampini     }
3778f4ddd8eeSStefano Zampini     ierr = MatGetSize(pcbddc->coarse_phi_B,&on_B,&on_primal);CHKERRQ(ierr);
377906656605SStefano Zampini     if (on_B != n_B || on_primal != pcbddc->local_primal_size || on_D != n_D) {
378006656605SStefano Zampini       PetscScalar *marray;
378106656605SStefano Zampini 
378206656605SStefano Zampini       ierr = MatDenseGetArray(pcbddc->coarse_phi_B,&marray);CHKERRQ(ierr);
378306656605SStefano Zampini       ierr = PetscFree(marray);CHKERRQ(ierr);
3784f4ddd8eeSStefano Zampini       ierr = MatDestroy(&pcbddc->coarse_phi_B);CHKERRQ(ierr);
3785f4ddd8eeSStefano Zampini       ierr = MatDestroy(&pcbddc->coarse_psi_B);CHKERRQ(ierr);
3786f4ddd8eeSStefano Zampini       ierr = MatDestroy(&pcbddc->coarse_phi_D);CHKERRQ(ierr);
3787f4ddd8eeSStefano Zampini       ierr = MatDestroy(&pcbddc->coarse_psi_D);CHKERRQ(ierr);
3788f4ddd8eeSStefano Zampini     }
3789f4ddd8eeSStefano Zampini   }
379006656605SStefano Zampini 
3791f4ddd8eeSStefano Zampini   if (!pcbddc->coarse_phi_B) {
3792a6e023c1Sstefano_zampini     PetscScalar *marr;
379388ebb749SStefano Zampini 
3794a6e023c1Sstefano_zampini     /* memory size */
379506656605SStefano Zampini     n = n_B*pcbddc->local_primal_size;
3796a6e023c1Sstefano_zampini     if (pcbddc->switch_static || pcbddc->dbg_flag) n += n_D*pcbddc->local_primal_size;
3797a6e023c1Sstefano_zampini     if (!pcbddc->symmetric_primal) n *= 2;
3798a6e023c1Sstefano_zampini     ierr  = PetscCalloc1(n,&marr);CHKERRQ(ierr);
3799a6e023c1Sstefano_zampini     ierr  = MatCreateSeqDense(PETSC_COMM_SELF,n_B,pcbddc->local_primal_size,marr,&pcbddc->coarse_phi_B);CHKERRQ(ierr);
3800a6e023c1Sstefano_zampini     marr += n_B*pcbddc->local_primal_size;
38018eeda7d8SStefano Zampini     if (pcbddc->switch_static || pcbddc->dbg_flag) {
3802a6e023c1Sstefano_zampini       ierr  = MatCreateSeqDense(PETSC_COMM_SELF,n_D,pcbddc->local_primal_size,marr,&pcbddc->coarse_phi_D);CHKERRQ(ierr);
3803a6e023c1Sstefano_zampini       marr += n_D*pcbddc->local_primal_size;
380488ebb749SStefano Zampini     }
38053301b35fSStefano Zampini     if (!pcbddc->symmetric_primal) {
3806a6e023c1Sstefano_zampini       ierr  = MatCreateSeqDense(PETSC_COMM_SELF,n_B,pcbddc->local_primal_size,marr,&pcbddc->coarse_psi_B);CHKERRQ(ierr);
3807a6e023c1Sstefano_zampini       marr += n_B*pcbddc->local_primal_size;
38088eeda7d8SStefano Zampini       if (pcbddc->switch_static || pcbddc->dbg_flag) {
3809a6e023c1Sstefano_zampini         ierr = MatCreateSeqDense(PETSC_COMM_SELF,n_D,pcbddc->local_primal_size,marr,&pcbddc->coarse_psi_D);CHKERRQ(ierr);
381088ebb749SStefano Zampini       }
381188ebb749SStefano Zampini     } else {
3812c0553b1fSStefano Zampini       ierr = PetscObjectReference((PetscObject)pcbddc->coarse_phi_B);CHKERRQ(ierr);
3813c0553b1fSStefano Zampini       pcbddc->coarse_psi_B = pcbddc->coarse_phi_B;
38141b968477SStefano Zampini       if (pcbddc->switch_static || pcbddc->dbg_flag) {
3815c0553b1fSStefano Zampini         ierr = PetscObjectReference((PetscObject)pcbddc->coarse_phi_D);CHKERRQ(ierr);
3816c0553b1fSStefano Zampini         pcbddc->coarse_psi_D = pcbddc->coarse_phi_D;
3817c0553b1fSStefano Zampini       }
381888ebb749SStefano Zampini     }
381906656605SStefano Zampini   }
3820019a44ceSStefano Zampini 
382106656605SStefano Zampini   /* We are now ready to evaluate coarse basis functions and subdomain contribution to coarse problem */
38224f1b2e48SStefano Zampini   p0_lidx_I = NULL;
38234f1b2e48SStefano Zampini   if (pcbddc->benign_n && (pcbddc->switch_static || pcbddc->dbg_flag)) {
3824d12edf2fSStefano Zampini     const PetscInt *idxs;
3825d12edf2fSStefano Zampini 
3826d12edf2fSStefano Zampini     ierr = ISGetIndices(pcis->is_I_local,&idxs);CHKERRQ(ierr);
38274f1b2e48SStefano Zampini     ierr = PetscMalloc1(pcbddc->benign_n,&p0_lidx_I);CHKERRQ(ierr);
38284f1b2e48SStefano Zampini     for (i=0;i<pcbddc->benign_n;i++) {
38294f1b2e48SStefano Zampini       ierr = PetscFindInt(pcbddc->benign_p0_lidx[i],pcis->n-pcis->n_B,idxs,&p0_lidx_I[i]);CHKERRQ(ierr);
38304f1b2e48SStefano Zampini     }
3831d12edf2fSStefano Zampini     ierr = ISRestoreIndices(pcis->is_I_local,&idxs);CHKERRQ(ierr);
3832d12edf2fSStefano Zampini   }
3833d16cbb6bSStefano Zampini 
383406656605SStefano Zampini   /* vertices */
383506656605SStefano Zampini   if (n_vertices) {
3836c58f9fdbSStefano Zampini     PetscBool restoreavr = PETSC_FALSE;
383716f15bc4SStefano Zampini 
3838af25d912SStefano Zampini     ierr = MatConvert(A_VV,MATDENSE,MAT_INPLACE_MATRIX,&A_VV);CHKERRQ(ierr);
383904708bb6SStefano Zampini 
384016f15bc4SStefano Zampini     if (n_R) {
384114393ed6SStefano Zampini       Mat          A_RRmA_RV,A_RV_bcorr=NULL,S_VVt; /* S_VVt with LDA=N */
384206656605SStefano Zampini       PetscBLASInt B_N,B_one = 1;
384316f15bc4SStefano Zampini       PetscScalar  *x,*y;
384406656605SStefano Zampini 
384521eccb56SStefano Zampini       ierr = MatScale(A_RV,m_one);CHKERRQ(ierr);
384614393ed6SStefano Zampini       if (need_benign_correction) {
384714393ed6SStefano Zampini         ISLocalToGlobalMapping RtoN;
384814393ed6SStefano Zampini         IS                     is_p0;
384914393ed6SStefano Zampini         PetscInt               *idxs_p0,n;
385014393ed6SStefano Zampini 
385114393ed6SStefano Zampini         ierr = PetscMalloc1(pcbddc->benign_n,&idxs_p0);CHKERRQ(ierr);
385214393ed6SStefano Zampini         ierr = ISLocalToGlobalMappingCreateIS(pcbddc->is_R_local,&RtoN);CHKERRQ(ierr);
385314393ed6SStefano Zampini         ierr = ISGlobalToLocalMappingApply(RtoN,IS_GTOLM_DROP,pcbddc->benign_n,pcbddc->benign_p0_lidx,&n,idxs_p0);CHKERRQ(ierr);
3854af25d912SStefano Zampini         if (n != pcbddc->benign_n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Error in R numbering for benign p0! %d != %d\n",n,pcbddc->benign_n);
385514393ed6SStefano Zampini         ierr = ISLocalToGlobalMappingDestroy(&RtoN);CHKERRQ(ierr);
385614393ed6SStefano Zampini         ierr = ISCreateGeneral(PETSC_COMM_SELF,n,idxs_p0,PETSC_OWN_POINTER,&is_p0);CHKERRQ(ierr);
38577dae84e0SHong Zhang         ierr = MatCreateSubMatrix(A_RV,is_p0,NULL,MAT_INITIAL_MATRIX,&A_RV_bcorr);CHKERRQ(ierr);
385814393ed6SStefano Zampini         ierr = ISDestroy(&is_p0);CHKERRQ(ierr);
385914393ed6SStefano Zampini       }
386014393ed6SStefano Zampini 
3861c58f9fdbSStefano Zampini       ierr = MatCreateSeqDense(PETSC_COMM_SELF,lda_rhs,n_vertices,work,&A_RRmA_RV);CHKERRQ(ierr);
3862c58f9fdbSStefano Zampini       if (!sparserhs || need_benign_correction) {
3863ffd830a3SStefano Zampini         if (lda_rhs == n_R) {
3864af25d912SStefano Zampini           ierr = MatConvert(A_RV,MATDENSE,MAT_INPLACE_MATRIX,&A_RV);CHKERRQ(ierr);
3865ffd830a3SStefano Zampini         } else {
3866ca92afb2SStefano Zampini           PetscScalar    *av,*array;
3867ca92afb2SStefano Zampini           const PetscInt *xadj,*adjncy;
3868ca92afb2SStefano Zampini           PetscInt       n;
3869ca92afb2SStefano Zampini           PetscBool      flg_row;
3870ffd830a3SStefano Zampini 
3871ca92afb2SStefano Zampini           array = work+lda_rhs*n_vertices;
3872ca92afb2SStefano Zampini           ierr = PetscMemzero(array,lda_rhs*n_vertices*sizeof(PetscScalar));CHKERRQ(ierr);
38739d54b7f4SStefano Zampini           ierr = MatConvert(A_RV,MATSEQAIJ,MAT_INPLACE_MATRIX,&A_RV);CHKERRQ(ierr);
3874ca92afb2SStefano Zampini           ierr = MatGetRowIJ(A_RV,0,PETSC_FALSE,PETSC_FALSE,&n,&xadj,&adjncy,&flg_row);CHKERRQ(ierr);
3875ca92afb2SStefano Zampini           ierr = MatSeqAIJGetArray(A_RV,&av);CHKERRQ(ierr);
3876ca92afb2SStefano Zampini           for (i=0;i<n;i++) {
3877ca92afb2SStefano Zampini             PetscInt j;
3878ca92afb2SStefano Zampini             for (j=xadj[i];j<xadj[i+1];j++) array[lda_rhs*adjncy[j]+i] = av[j];
3879ffd830a3SStefano Zampini           }
3880ca92afb2SStefano Zampini           ierr = MatRestoreRowIJ(A_RV,0,PETSC_FALSE,PETSC_FALSE,&n,&xadj,&adjncy,&flg_row);CHKERRQ(ierr);
3881ca92afb2SStefano Zampini           ierr = MatDestroy(&A_RV);CHKERRQ(ierr);
3882ca92afb2SStefano Zampini           ierr = MatCreateSeqDense(PETSC_COMM_SELF,lda_rhs,n_vertices,array,&A_RV);CHKERRQ(ierr);
3883ffd830a3SStefano Zampini         }
3884a3df083aSStefano Zampini         if (need_benign_correction) {
3885df4d28bfSStefano Zampini           PCBDDCReuseSolvers reuse_solver = sub_schurs->reuse_solver;
3886a3df083aSStefano Zampini           PetscScalar        *marr;
3887a3df083aSStefano Zampini 
3888a3df083aSStefano Zampini           ierr = MatDenseGetArray(A_RV,&marr);CHKERRQ(ierr);
388914393ed6SStefano Zampini           /* need \Phi^T A_RV = (I+L)A_RV, L given by
389014393ed6SStefano Zampini 
389114393ed6SStefano Zampini                  | 0 0  0 | (V)
389214393ed6SStefano Zampini              L = | 0 0 -1 | (P-p0)
389314393ed6SStefano Zampini                  | 0 0 -1 | (p0)
389414393ed6SStefano Zampini 
389514393ed6SStefano Zampini           */
3896df4d28bfSStefano Zampini           for (i=0;i<reuse_solver->benign_n;i++) {
389714393ed6SStefano Zampini             const PetscScalar *vals;
389814393ed6SStefano Zampini             const PetscInt    *idxs,*idxs_zero;
389914393ed6SStefano Zampini             PetscInt          n,j,nz;
390014393ed6SStefano Zampini 
3901df4d28bfSStefano Zampini             ierr = ISGetLocalSize(reuse_solver->benign_zerodiag_subs[i],&nz);CHKERRQ(ierr);
3902df4d28bfSStefano Zampini             ierr = ISGetIndices(reuse_solver->benign_zerodiag_subs[i],&idxs_zero);CHKERRQ(ierr);
390314393ed6SStefano Zampini             ierr = MatGetRow(A_RV_bcorr,i,&n,&idxs,&vals);CHKERRQ(ierr);
390414393ed6SStefano Zampini             for (j=0;j<n;j++) {
390514393ed6SStefano Zampini               PetscScalar val = vals[j];
390614393ed6SStefano Zampini               PetscInt    k,col = idxs[j];
390714393ed6SStefano Zampini               for (k=0;k<nz;k++) marr[idxs_zero[k]+lda_rhs*col] -= val;
390814393ed6SStefano Zampini             }
390914393ed6SStefano Zampini             ierr = MatRestoreRow(A_RV_bcorr,i,&n,&idxs,&vals);CHKERRQ(ierr);
3910df4d28bfSStefano Zampini             ierr = ISRestoreIndices(reuse_solver->benign_zerodiag_subs[i],&idxs_zero);CHKERRQ(ierr);
391114393ed6SStefano Zampini           }
391272b8c272SStefano Zampini           ierr = MatDenseRestoreArray(A_RV,&marr);CHKERRQ(ierr);
391372b8c272SStefano Zampini         }
3914c58f9fdbSStefano Zampini         ierr = PetscObjectReference((PetscObject)A_RV);CHKERRQ(ierr);
3915c58f9fdbSStefano Zampini         Brhs = A_RV;
3916c58f9fdbSStefano Zampini       } else {
3917c58f9fdbSStefano Zampini         Mat tA_RVT,A_RVT;
3918c58f9fdbSStefano Zampini 
3919c58f9fdbSStefano Zampini         if (!pcbddc->symmetric_primal) {
3920c58f9fdbSStefano Zampini           ierr = MatTranspose(A_RV,MAT_INITIAL_MATRIX,&A_RVT);CHKERRQ(ierr);
3921c58f9fdbSStefano Zampini         } else {
3922c58f9fdbSStefano Zampini           restoreavr = PETSC_TRUE;
3923c58f9fdbSStefano Zampini           ierr  = MatScale(A_VR,-1.0);CHKERRQ(ierr);
3924c58f9fdbSStefano Zampini           ierr  = PetscObjectReference((PetscObject)A_VR);CHKERRQ(ierr);
3925c58f9fdbSStefano Zampini           A_RVT = A_VR;
3926c58f9fdbSStefano Zampini         }
3927c58f9fdbSStefano Zampini         if (lda_rhs != n_R) {
3928c58f9fdbSStefano Zampini           PetscScalar *aa;
3929c58f9fdbSStefano Zampini           PetscInt    r,*ii,*jj;
3930c58f9fdbSStefano Zampini           PetscBool   done;
3931c58f9fdbSStefano Zampini 
3932c58f9fdbSStefano Zampini           ierr = MatGetRowIJ(A_RVT,0,PETSC_FALSE,PETSC_FALSE,&r,(const PetscInt**)&ii,(const PetscInt**)&jj,&done);CHKERRQ(ierr);
393313903a91SSatish Balay           if (!done) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"GetRowIJ failed");
3934c58f9fdbSStefano Zampini           ierr = MatSeqAIJGetArray(A_RVT,&aa);CHKERRQ(ierr);
3935c58f9fdbSStefano Zampini           ierr = MatCreateSeqAIJWithArrays(PETSC_COMM_SELF,n_vertices,lda_rhs,ii,jj,aa,&tA_RVT);CHKERRQ(ierr);
3936c58f9fdbSStefano Zampini           ierr = MatRestoreRowIJ(A_RVT,0,PETSC_FALSE,PETSC_FALSE,&r,(const PetscInt**)&ii,(const PetscInt**)&jj,&done);CHKERRQ(ierr);
393713903a91SSatish Balay           if (!done) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"RestoreRowIJ failed");
3938c58f9fdbSStefano Zampini         } else {
3939c58f9fdbSStefano Zampini           ierr   = PetscObjectReference((PetscObject)A_RVT);CHKERRQ(ierr);
3940c58f9fdbSStefano Zampini           tA_RVT = A_RVT;
3941c58f9fdbSStefano Zampini         }
3942c58f9fdbSStefano Zampini         ierr = MatCreateTranspose(tA_RVT,&Brhs);CHKERRQ(ierr);
3943c58f9fdbSStefano Zampini         ierr = MatDestroy(&tA_RVT);CHKERRQ(ierr);
3944c58f9fdbSStefano Zampini         ierr = MatDestroy(&A_RVT);CHKERRQ(ierr);
3945c58f9fdbSStefano Zampini       }
394672b8c272SStefano Zampini       if (F) {
394714393ed6SStefano Zampini         /* need to correct the rhs */
394872b8c272SStefano Zampini         if (need_benign_correction) {
394972b8c272SStefano Zampini           PCBDDCReuseSolvers reuse_solver = sub_schurs->reuse_solver;
395072b8c272SStefano Zampini           PetscScalar        *marr;
395172b8c272SStefano Zampini 
3952c58f9fdbSStefano Zampini           ierr = MatDenseGetArray(Brhs,&marr);CHKERRQ(ierr);
39535cbda25cSStefano Zampini           if (lda_rhs != n_R) {
39545cbda25cSStefano Zampini             for (i=0;i<n_vertices;i++) {
39555cbda25cSStefano Zampini               ierr = VecPlaceArray(dummy_vec,marr+i*lda_rhs);CHKERRQ(ierr);
39565cbda25cSStefano Zampini               ierr = PCBDDCReuseSolversBenignAdapt(reuse_solver,dummy_vec,NULL,PETSC_FALSE,PETSC_TRUE);CHKERRQ(ierr);
39575cbda25cSStefano Zampini               ierr = VecResetArray(dummy_vec);CHKERRQ(ierr);
39585cbda25cSStefano Zampini             }
39595cbda25cSStefano Zampini           } else {
3960a3df083aSStefano Zampini             for (i=0;i<n_vertices;i++) {
3961a3df083aSStefano Zampini               ierr = VecPlaceArray(pcbddc->vec1_R,marr+i*lda_rhs);CHKERRQ(ierr);
39625cbda25cSStefano Zampini               ierr = PCBDDCReuseSolversBenignAdapt(reuse_solver,pcbddc->vec1_R,NULL,PETSC_FALSE,PETSC_TRUE);CHKERRQ(ierr);
3963a3df083aSStefano Zampini               ierr = VecResetArray(pcbddc->vec1_R);CHKERRQ(ierr);
3964a3df083aSStefano Zampini             }
39655cbda25cSStefano Zampini           }
3966c58f9fdbSStefano Zampini           ierr = MatDenseRestoreArray(Brhs,&marr);CHKERRQ(ierr);
3967a3df083aSStefano Zampini         }
3968c58f9fdbSStefano Zampini         ierr = MatMatSolve(F,Brhs,A_RRmA_RV);CHKERRQ(ierr);
3969c58f9fdbSStefano Zampini         if (restoreavr) {
3970c58f9fdbSStefano Zampini           ierr = MatScale(A_VR,-1.0);CHKERRQ(ierr);
3971c58f9fdbSStefano Zampini         }
397214393ed6SStefano Zampini         /* need to correct the solution */
3973a3df083aSStefano Zampini         if (need_benign_correction) {
3974df4d28bfSStefano Zampini           PCBDDCReuseSolvers reuse_solver = sub_schurs->reuse_solver;
3975a3df083aSStefano Zampini           PetscScalar        *marr;
3976a3df083aSStefano Zampini 
3977a3df083aSStefano Zampini           ierr = MatDenseGetArray(A_RRmA_RV,&marr);CHKERRQ(ierr);
39785cbda25cSStefano Zampini           if (lda_rhs != n_R) {
39795cbda25cSStefano Zampini             for (i=0;i<n_vertices;i++) {
39805cbda25cSStefano Zampini               ierr = VecPlaceArray(dummy_vec,marr+i*lda_rhs);CHKERRQ(ierr);
39815cbda25cSStefano Zampini               ierr = PCBDDCReuseSolversBenignAdapt(reuse_solver,dummy_vec,NULL,PETSC_TRUE,PETSC_TRUE);CHKERRQ(ierr);
39825cbda25cSStefano Zampini               ierr = VecResetArray(dummy_vec);CHKERRQ(ierr);
39835cbda25cSStefano Zampini             }
39845cbda25cSStefano Zampini           } else {
3985a3df083aSStefano Zampini             for (i=0;i<n_vertices;i++) {
3986a3df083aSStefano Zampini               ierr = VecPlaceArray(pcbddc->vec1_R,marr+i*lda_rhs);CHKERRQ(ierr);
39875cbda25cSStefano Zampini               ierr = PCBDDCReuseSolversBenignAdapt(reuse_solver,pcbddc->vec1_R,NULL,PETSC_TRUE,PETSC_TRUE);CHKERRQ(ierr);
3988a3df083aSStefano Zampini               ierr = VecResetArray(pcbddc->vec1_R);CHKERRQ(ierr);
3989a3df083aSStefano Zampini             }
39905cbda25cSStefano Zampini           }
3991a3df083aSStefano Zampini           ierr = MatDenseRestoreArray(A_RRmA_RV,&marr);CHKERRQ(ierr);
3992a3df083aSStefano Zampini         }
399306656605SStefano Zampini       } else {
3994c58f9fdbSStefano Zampini         ierr = MatDenseGetArray(Brhs,&y);CHKERRQ(ierr);
399506656605SStefano Zampini         for (i=0;i<n_vertices;i++) {
3996ffd830a3SStefano Zampini           ierr = VecPlaceArray(pcbddc->vec1_R,y+i*lda_rhs);CHKERRQ(ierr);
3997ffd830a3SStefano Zampini           ierr = VecPlaceArray(pcbddc->vec2_R,work+i*lda_rhs);CHKERRQ(ierr);
399806656605SStefano Zampini           ierr = KSPSolve(pcbddc->ksp_R,pcbddc->vec1_R,pcbddc->vec2_R);CHKERRQ(ierr);
399906656605SStefano Zampini           ierr = VecResetArray(pcbddc->vec1_R);CHKERRQ(ierr);
400006656605SStefano Zampini           ierr = VecResetArray(pcbddc->vec2_R);CHKERRQ(ierr);
400106656605SStefano Zampini         }
4002c58f9fdbSStefano Zampini         ierr = MatDenseRestoreArray(Brhs,&y);CHKERRQ(ierr);
400306656605SStefano Zampini       }
400480677318SStefano Zampini       ierr = MatDestroy(&A_RV);CHKERRQ(ierr);
4005c58f9fdbSStefano Zampini       ierr = MatDestroy(&Brhs);CHKERRQ(ierr);
4006ffd830a3SStefano Zampini       /* S_VV and S_CV */
400706656605SStefano Zampini       if (n_constraints) {
400806656605SStefano Zampini         Mat B;
400980677318SStefano Zampini 
4010ffd830a3SStefano Zampini         ierr = PetscMemzero(work+lda_rhs*n_vertices,n_B*n_vertices*sizeof(PetscScalar));CHKERRQ(ierr);
401180677318SStefano Zampini         for (i=0;i<n_vertices;i++) {
4012ffd830a3SStefano Zampini           ierr = VecPlaceArray(pcbddc->vec1_R,work+i*lda_rhs);CHKERRQ(ierr);
4013ffd830a3SStefano Zampini           ierr = VecPlaceArray(pcis->vec1_B,work+lda_rhs*n_vertices+i*n_B);CHKERRQ(ierr);
401480677318SStefano Zampini           ierr = VecScatterBegin(pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
401580677318SStefano Zampini           ierr = VecScatterEnd(pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
401680677318SStefano Zampini           ierr = VecResetArray(pcis->vec1_B);CHKERRQ(ierr);
401780677318SStefano Zampini           ierr = VecResetArray(pcbddc->vec1_R);CHKERRQ(ierr);
401880677318SStefano Zampini         }
4019ffd830a3SStefano Zampini         ierr = MatCreateSeqDense(PETSC_COMM_SELF,n_B,n_vertices,work+lda_rhs*n_vertices,&B);CHKERRQ(ierr);
402080677318SStefano Zampini         ierr = MatMatMult(pcbddc->local_auxmat1,B,MAT_REUSE_MATRIX,PETSC_DEFAULT,&S_CV);CHKERRQ(ierr);
402180677318SStefano Zampini         ierr = MatDestroy(&B);CHKERRQ(ierr);
4022ffd830a3SStefano Zampini         ierr = MatCreateSeqDense(PETSC_COMM_SELF,lda_rhs,n_vertices,work+lda_rhs*n_vertices,&B);CHKERRQ(ierr);
402380677318SStefano Zampini         ierr = MatMatMult(local_auxmat2_R,S_CV,MAT_REUSE_MATRIX,PETSC_DEFAULT,&B);CHKERRQ(ierr);
402406656605SStefano Zampini         ierr = MatScale(S_CV,m_one);CHKERRQ(ierr);
4025ffd830a3SStefano Zampini         ierr = PetscBLASIntCast(lda_rhs*n_vertices,&B_N);CHKERRQ(ierr);
4026ffd830a3SStefano Zampini         PetscStackCallBLAS("BLASaxpy",BLASaxpy_(&B_N,&one,work+lda_rhs*n_vertices,&B_one,work,&B_one));
402706656605SStefano Zampini         ierr = MatDestroy(&B);CHKERRQ(ierr);
402806656605SStefano Zampini       }
4029ffd830a3SStefano Zampini       if (lda_rhs != n_R) {
4030ffd830a3SStefano Zampini         ierr = MatDestroy(&A_RRmA_RV);CHKERRQ(ierr);
4031ffd830a3SStefano Zampini         ierr = MatCreateSeqDense(PETSC_COMM_SELF,n_R,n_vertices,work,&A_RRmA_RV);CHKERRQ(ierr);
4032ffd830a3SStefano Zampini         ierr = MatSeqDenseSetLDA(A_RRmA_RV,lda_rhs);CHKERRQ(ierr);
4033ffd830a3SStefano Zampini       }
403406656605SStefano Zampini       ierr = MatMatMult(A_VR,A_RRmA_RV,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&S_VVt);CHKERRQ(ierr);
403514393ed6SStefano Zampini       /* need A_VR * \Phi * A_RRmA_RV = A_VR * (I+L)^T * A_RRmA_RV, L given as before */
403614393ed6SStefano Zampini       if (need_benign_correction) {
4037df4d28bfSStefano Zampini         PCBDDCReuseSolvers reuse_solver = sub_schurs->reuse_solver;
403814393ed6SStefano Zampini         PetscScalar      *marr,*sums;
403914393ed6SStefano Zampini 
404014393ed6SStefano Zampini         ierr = PetscMalloc1(n_vertices,&sums);CHKERRQ(ierr);
4041f913dca9SStefano Zampini         ierr = MatDenseGetArray(S_VVt,&marr);CHKERRQ(ierr);
4042df4d28bfSStefano Zampini         for (i=0;i<reuse_solver->benign_n;i++) {
404314393ed6SStefano Zampini           const PetscScalar *vals;
404414393ed6SStefano Zampini           const PetscInt    *idxs,*idxs_zero;
404514393ed6SStefano Zampini           PetscInt          n,j,nz;
404614393ed6SStefano Zampini 
4047df4d28bfSStefano Zampini           ierr = ISGetLocalSize(reuse_solver->benign_zerodiag_subs[i],&nz);CHKERRQ(ierr);
4048df4d28bfSStefano Zampini           ierr = ISGetIndices(reuse_solver->benign_zerodiag_subs[i],&idxs_zero);CHKERRQ(ierr);
404914393ed6SStefano Zampini           for (j=0;j<n_vertices;j++) {
405014393ed6SStefano Zampini             PetscInt k;
405114393ed6SStefano Zampini             sums[j] = 0.;
405214393ed6SStefano Zampini             for (k=0;k<nz;k++) sums[j] += work[idxs_zero[k]+j*lda_rhs];
405314393ed6SStefano Zampini           }
405414393ed6SStefano Zampini           ierr = MatGetRow(A_RV_bcorr,i,&n,&idxs,&vals);CHKERRQ(ierr);
405514393ed6SStefano Zampini           for (j=0;j<n;j++) {
405614393ed6SStefano Zampini             PetscScalar val = vals[j];
405714393ed6SStefano Zampini             PetscInt k;
405814393ed6SStefano Zampini             for (k=0;k<n_vertices;k++) {
405914393ed6SStefano Zampini               marr[idxs[j]+k*n_vertices] += val*sums[k];
406014393ed6SStefano Zampini             }
406114393ed6SStefano Zampini           }
406214393ed6SStefano Zampini           ierr = MatRestoreRow(A_RV_bcorr,i,&n,&idxs,&vals);CHKERRQ(ierr);
4063df4d28bfSStefano Zampini           ierr = ISRestoreIndices(reuse_solver->benign_zerodiag_subs[i],&idxs_zero);CHKERRQ(ierr);
406414393ed6SStefano Zampini         }
406514393ed6SStefano Zampini         ierr = PetscFree(sums);CHKERRQ(ierr);
4066f913dca9SStefano Zampini         ierr = MatDenseRestoreArray(S_VVt,&marr);CHKERRQ(ierr);
406714393ed6SStefano Zampini         ierr = MatDestroy(&A_RV_bcorr);CHKERRQ(ierr);
406814393ed6SStefano Zampini       }
406980677318SStefano Zampini       ierr = MatDestroy(&A_RRmA_RV);CHKERRQ(ierr);
407006656605SStefano Zampini       ierr = PetscBLASIntCast(n_vertices*n_vertices,&B_N);CHKERRQ(ierr);
407106656605SStefano Zampini       ierr = MatDenseGetArray(A_VV,&x);CHKERRQ(ierr);
407206656605SStefano Zampini       ierr = MatDenseGetArray(S_VVt,&y);CHKERRQ(ierr);
407306656605SStefano Zampini       PetscStackCallBLAS("BLASaxpy",BLASaxpy_(&B_N,&one,x,&B_one,y,&B_one));
407406656605SStefano Zampini       ierr = MatDenseRestoreArray(A_VV,&x);CHKERRQ(ierr);
407506656605SStefano Zampini       ierr = MatDenseRestoreArray(S_VVt,&y);CHKERRQ(ierr);
407606656605SStefano Zampini       ierr = MatCopy(S_VVt,S_VV,SAME_NONZERO_PATTERN);CHKERRQ(ierr);
4077d16cbb6bSStefano Zampini       ierr = MatDestroy(&S_VVt);CHKERRQ(ierr);
4078019a44ceSStefano Zampini     } else {
4079d16cbb6bSStefano Zampini       ierr = MatCopy(A_VV,S_VV,SAME_NONZERO_PATTERN);CHKERRQ(ierr);
4080d16cbb6bSStefano Zampini     }
408121eccb56SStefano Zampini     ierr = MatDestroy(&A_VV);CHKERRQ(ierr);
4082d16cbb6bSStefano Zampini 
408306656605SStefano Zampini     /* coarse basis functions */
408406656605SStefano Zampini     for (i=0;i<n_vertices;i++) {
408516f15bc4SStefano Zampini       PetscScalar *y;
408616f15bc4SStefano Zampini 
4087ffd830a3SStefano Zampini       ierr = VecPlaceArray(pcbddc->vec1_R,work+lda_rhs*i);CHKERRQ(ierr);
408806656605SStefano Zampini       ierr = MatDenseGetArray(pcbddc->coarse_phi_B,&y);CHKERRQ(ierr);
408906656605SStefano Zampini       ierr = VecPlaceArray(pcis->vec1_B,y+n_B*i);CHKERRQ(ierr);
409006656605SStefano Zampini       ierr = VecScatterBegin(pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
409106656605SStefano Zampini       ierr = VecScatterEnd(pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
409206656605SStefano Zampini       y[n_B*i+idx_V_B[i]] = 1.0;
409306656605SStefano Zampini       ierr = MatDenseRestoreArray(pcbddc->coarse_phi_B,&y);CHKERRQ(ierr);
409406656605SStefano Zampini       ierr = VecResetArray(pcis->vec1_B);CHKERRQ(ierr);
409506656605SStefano Zampini 
409606656605SStefano Zampini       if (pcbddc->switch_static || pcbddc->dbg_flag) {
40974f1b2e48SStefano Zampini         PetscInt j;
40984f1b2e48SStefano Zampini 
409906656605SStefano Zampini         ierr = MatDenseGetArray(pcbddc->coarse_phi_D,&y);CHKERRQ(ierr);
410006656605SStefano Zampini         ierr = VecPlaceArray(pcis->vec1_D,y+n_D*i);CHKERRQ(ierr);
410106656605SStefano Zampini         ierr = VecScatterBegin(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
410206656605SStefano Zampini         ierr = VecScatterEnd(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
410306656605SStefano Zampini         ierr = VecResetArray(pcis->vec1_D);CHKERRQ(ierr);
41044f1b2e48SStefano Zampini         for (j=0;j<pcbddc->benign_n;j++) y[n_D*i+p0_lidx_I[j]] = 0.0;
410506656605SStefano Zampini         ierr = MatDenseRestoreArray(pcbddc->coarse_phi_D,&y);CHKERRQ(ierr);
410606656605SStefano Zampini       }
410706656605SStefano Zampini       ierr = VecResetArray(pcbddc->vec1_R);CHKERRQ(ierr);
410806656605SStefano Zampini     }
410904708bb6SStefano Zampini     /* if n_R == 0 the object is not destroyed */
411004708bb6SStefano Zampini     ierr = MatDestroy(&A_RV);CHKERRQ(ierr);
411106656605SStefano Zampini   }
41125cbda25cSStefano Zampini   ierr = VecDestroy(&dummy_vec);CHKERRQ(ierr);
411306656605SStefano Zampini 
411406656605SStefano Zampini   if (n_constraints) {
411506656605SStefano Zampini     Mat B;
411606656605SStefano Zampini 
4117ffd830a3SStefano Zampini     ierr = MatCreateSeqDense(PETSC_COMM_SELF,lda_rhs,n_constraints,work,&B);CHKERRQ(ierr);
411806656605SStefano Zampini     ierr = MatScale(S_CC,m_one);CHKERRQ(ierr);
411980677318SStefano Zampini     ierr = MatMatMult(local_auxmat2_R,S_CC,MAT_REUSE_MATRIX,PETSC_DEFAULT,&B);CHKERRQ(ierr);
412006656605SStefano Zampini     ierr = MatScale(S_CC,m_one);CHKERRQ(ierr);
412106656605SStefano Zampini     if (n_vertices) {
412280677318SStefano Zampini       if (isCHOL) { /* if we can solve the interior problem with cholesky, we should also be fine with transposing here */
412380677318SStefano Zampini         ierr = MatTranspose(S_CV,MAT_REUSE_MATRIX,&S_VC);CHKERRQ(ierr);
412480677318SStefano Zampini       } else {
412580677318SStefano Zampini         Mat S_VCt;
412680677318SStefano Zampini 
4127ffd830a3SStefano Zampini         if (lda_rhs != n_R) {
4128ffd830a3SStefano Zampini           ierr = MatDestroy(&B);CHKERRQ(ierr);
412972b8c272SStefano Zampini           ierr = MatCreateSeqDense(PETSC_COMM_SELF,n_R,n_constraints,work,&B);CHKERRQ(ierr);
4130ffd830a3SStefano Zampini           ierr = MatSeqDenseSetLDA(B,lda_rhs);CHKERRQ(ierr);
4131ffd830a3SStefano Zampini         }
413280677318SStefano Zampini         ierr = MatMatMult(A_VR,B,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&S_VCt);CHKERRQ(ierr);
413380677318SStefano Zampini         ierr = MatCopy(S_VCt,S_VC,SAME_NONZERO_PATTERN);CHKERRQ(ierr);
413480677318SStefano Zampini         ierr = MatDestroy(&S_VCt);CHKERRQ(ierr);
413580677318SStefano Zampini       }
413606656605SStefano Zampini     }
413706656605SStefano Zampini     ierr = MatDestroy(&B);CHKERRQ(ierr);
413806656605SStefano Zampini     /* coarse basis functions */
413906656605SStefano Zampini     for (i=0;i<n_constraints;i++) {
414006656605SStefano Zampini       PetscScalar *y;
414106656605SStefano Zampini 
4142ffd830a3SStefano Zampini       ierr = VecPlaceArray(pcbddc->vec1_R,work+lda_rhs*i);CHKERRQ(ierr);
414306656605SStefano Zampini       ierr = MatDenseGetArray(pcbddc->coarse_phi_B,&y);CHKERRQ(ierr);
414406656605SStefano Zampini       ierr = VecPlaceArray(pcis->vec1_B,y+n_B*(i+n_vertices));CHKERRQ(ierr);
414506656605SStefano Zampini       ierr = VecScatterBegin(pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
414606656605SStefano Zampini       ierr = VecScatterEnd(pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
414706656605SStefano Zampini       ierr = MatDenseRestoreArray(pcbddc->coarse_phi_B,&y);CHKERRQ(ierr);
414806656605SStefano Zampini       ierr = VecResetArray(pcis->vec1_B);CHKERRQ(ierr);
414906656605SStefano Zampini       if (pcbddc->switch_static || pcbddc->dbg_flag) {
41504f1b2e48SStefano Zampini         PetscInt j;
41514f1b2e48SStefano Zampini 
415206656605SStefano Zampini         ierr = MatDenseGetArray(pcbddc->coarse_phi_D,&y);CHKERRQ(ierr);
415306656605SStefano Zampini         ierr = VecPlaceArray(pcis->vec1_D,y+n_D*(i+n_vertices));CHKERRQ(ierr);
415406656605SStefano Zampini         ierr = VecScatterBegin(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
415506656605SStefano Zampini         ierr = VecScatterEnd(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
415606656605SStefano Zampini         ierr = VecResetArray(pcis->vec1_D);CHKERRQ(ierr);
41574f1b2e48SStefano Zampini         for (j=0;j<pcbddc->benign_n;j++) y[n_D*i+p0_lidx_I[j]] = 0.0;
415806656605SStefano Zampini         ierr = MatDenseRestoreArray(pcbddc->coarse_phi_D,&y);CHKERRQ(ierr);
415906656605SStefano Zampini       }
416006656605SStefano Zampini       ierr = VecResetArray(pcbddc->vec1_R);CHKERRQ(ierr);
416106656605SStefano Zampini     }
416206656605SStefano Zampini   }
416380677318SStefano Zampini   if (n_constraints) {
416480677318SStefano Zampini     ierr = MatDestroy(&local_auxmat2_R);CHKERRQ(ierr);
416580677318SStefano Zampini   }
41664f1b2e48SStefano Zampini   ierr = PetscFree(p0_lidx_I);CHKERRQ(ierr);
416772b8c272SStefano Zampini 
416872b8c272SStefano Zampini   /* coarse matrix entries relative to B_0 */
416972b8c272SStefano Zampini   if (pcbddc->benign_n) {
417072b8c272SStefano Zampini     Mat         B0_B,B0_BPHI;
417172b8c272SStefano Zampini     IS          is_dummy;
417272b8c272SStefano Zampini     PetscScalar *data;
417372b8c272SStefano Zampini     PetscInt    j;
417472b8c272SStefano Zampini 
417572b8c272SStefano Zampini     ierr = ISCreateStride(PETSC_COMM_SELF,pcbddc->benign_n,0,1,&is_dummy);CHKERRQ(ierr);
41767dae84e0SHong Zhang     ierr = MatCreateSubMatrix(pcbddc->benign_B0,is_dummy,pcis->is_B_local,MAT_INITIAL_MATRIX,&B0_B);CHKERRQ(ierr);
417772b8c272SStefano Zampini     ierr = ISDestroy(&is_dummy);CHKERRQ(ierr);
417872b8c272SStefano Zampini     ierr = MatMatMult(B0_B,pcbddc->coarse_phi_B,MAT_INITIAL_MATRIX,1.0,&B0_BPHI);CHKERRQ(ierr);
417986c38910SStefano Zampini     ierr = MatConvert(B0_BPHI,MATSEQDENSE,MAT_INPLACE_MATRIX,&B0_BPHI);CHKERRQ(ierr);
418072b8c272SStefano Zampini     ierr = MatDenseGetArray(B0_BPHI,&data);CHKERRQ(ierr);
418172b8c272SStefano Zampini     for (j=0;j<pcbddc->benign_n;j++) {
418272b8c272SStefano Zampini       PetscInt primal_idx = pcbddc->local_primal_size - pcbddc->benign_n + j;
418372b8c272SStefano Zampini       for (i=0;i<pcbddc->local_primal_size;i++) {
418472b8c272SStefano Zampini         coarse_submat_vals[primal_idx*pcbddc->local_primal_size+i] = data[i*pcbddc->benign_n+j];
418572b8c272SStefano Zampini         coarse_submat_vals[i*pcbddc->local_primal_size+primal_idx] = data[i*pcbddc->benign_n+j];
418672b8c272SStefano Zampini       }
418772b8c272SStefano Zampini     }
418872b8c272SStefano Zampini     ierr = MatDenseRestoreArray(B0_BPHI,&data);CHKERRQ(ierr);
418972b8c272SStefano Zampini     ierr = MatDestroy(&B0_B);CHKERRQ(ierr);
419072b8c272SStefano Zampini     ierr = MatDestroy(&B0_BPHI);CHKERRQ(ierr);
419172b8c272SStefano Zampini   }
4192019a44ceSStefano Zampini 
419306656605SStefano Zampini   /* compute other basis functions for non-symmetric problems */
41943301b35fSStefano Zampini   if (!pcbddc->symmetric_primal) {
4195ffd830a3SStefano Zampini     Mat         B_V=NULL,B_C=NULL;
4196ffd830a3SStefano Zampini     PetscScalar *marray;
419706656605SStefano Zampini 
419806656605SStefano Zampini     if (n_constraints) {
4199ffd830a3SStefano Zampini       Mat S_CCT,C_CRT;
420006656605SStefano Zampini 
4201abc8f43dSstefano_zampini       ierr = MatTranspose(C_CR,MAT_INITIAL_MATRIX,&C_CRT);CHKERRQ(ierr);
420206656605SStefano Zampini       ierr = MatTranspose(S_CC,MAT_INITIAL_MATRIX,&S_CCT);CHKERRQ(ierr);
4203ffd830a3SStefano Zampini       ierr = MatMatMult(C_CRT,S_CCT,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&B_C);CHKERRQ(ierr);
420416f15bc4SStefano Zampini       ierr = MatDestroy(&S_CCT);CHKERRQ(ierr);
420506656605SStefano Zampini       if (n_vertices) {
4206ffd830a3SStefano Zampini         Mat S_VCT;
420706656605SStefano Zampini 
420806656605SStefano Zampini         ierr = MatTranspose(S_VC,MAT_INITIAL_MATRIX,&S_VCT);CHKERRQ(ierr);
4209ffd830a3SStefano Zampini         ierr = MatMatMult(C_CRT,S_VCT,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&B_V);CHKERRQ(ierr);
421016f15bc4SStefano Zampini         ierr = MatDestroy(&S_VCT);CHKERRQ(ierr);
421106656605SStefano Zampini       }
4212ffd830a3SStefano Zampini       ierr = MatDestroy(&C_CRT);CHKERRQ(ierr);
42135b782168SStefano Zampini     } else {
42145b782168SStefano Zampini       ierr = MatCreateSeqDense(PETSC_COMM_SELF,n_R,n_vertices,NULL,&B_V);CHKERRQ(ierr);
421506656605SStefano Zampini     }
421616f15bc4SStefano Zampini     if (n_vertices && n_R) {
4217ffd830a3SStefano Zampini       PetscScalar    *av,*marray;
4218ffd830a3SStefano Zampini       const PetscInt *xadj,*adjncy;
4219ffd830a3SStefano Zampini       PetscInt       n;
4220ffd830a3SStefano Zampini       PetscBool      flg_row;
422106656605SStefano Zampini 
4222ffd830a3SStefano Zampini       /* B_V = B_V - A_VR^T */
4223af25d912SStefano Zampini       ierr = MatConvert(A_VR,MATSEQAIJ,MAT_INPLACE_MATRIX,&A_VR);CHKERRQ(ierr);
4224ffd830a3SStefano Zampini       ierr = MatGetRowIJ(A_VR,0,PETSC_FALSE,PETSC_FALSE,&n,&xadj,&adjncy,&flg_row);CHKERRQ(ierr);
4225ffd830a3SStefano Zampini       ierr = MatSeqAIJGetArray(A_VR,&av);CHKERRQ(ierr);
4226ffd830a3SStefano Zampini       ierr = MatDenseGetArray(B_V,&marray);CHKERRQ(ierr);
4227ffd830a3SStefano Zampini       for (i=0;i<n;i++) {
4228ffd830a3SStefano Zampini         PetscInt j;
4229ffd830a3SStefano Zampini         for (j=xadj[i];j<xadj[i+1];j++) marray[i*n_R + adjncy[j]] -= av[j];
4230ffd830a3SStefano Zampini       }
4231ffd830a3SStefano Zampini       ierr = MatDenseRestoreArray(B_V,&marray);CHKERRQ(ierr);
4232ffd830a3SStefano Zampini       ierr = MatRestoreRowIJ(A_VR,0,PETSC_FALSE,PETSC_FALSE,&n,&xadj,&adjncy,&flg_row);CHKERRQ(ierr);
4233ffd830a3SStefano Zampini       ierr = MatDestroy(&A_VR);CHKERRQ(ierr);
423406656605SStefano Zampini     }
423506656605SStefano Zampini 
4236ffd830a3SStefano Zampini     /* currently there's no support for MatTransposeMatSolve(F,B,X) */
4237abc8f43dSstefano_zampini     if (n_vertices) {
4238ffd830a3SStefano Zampini       ierr = MatDenseGetArray(B_V,&marray);CHKERRQ(ierr);
4239ffd830a3SStefano Zampini       for (i=0;i<n_vertices;i++) {
4240ffd830a3SStefano Zampini         ierr = VecPlaceArray(pcbddc->vec1_R,marray+i*n_R);CHKERRQ(ierr);
4241ffd830a3SStefano Zampini         ierr = VecPlaceArray(pcbddc->vec2_R,work+i*n_R);CHKERRQ(ierr);
424206656605SStefano Zampini         ierr = KSPSolveTranspose(pcbddc->ksp_R,pcbddc->vec1_R,pcbddc->vec2_R);CHKERRQ(ierr);
424306656605SStefano Zampini         ierr = VecResetArray(pcbddc->vec1_R);CHKERRQ(ierr);
424406656605SStefano Zampini         ierr = VecResetArray(pcbddc->vec2_R);CHKERRQ(ierr);
424506656605SStefano Zampini       }
4246ffd830a3SStefano Zampini       ierr = MatDenseRestoreArray(B_V,&marray);CHKERRQ(ierr);
4247abc8f43dSstefano_zampini     }
42485b782168SStefano Zampini     if (B_C) {
4249ffd830a3SStefano Zampini       ierr = MatDenseGetArray(B_C,&marray);CHKERRQ(ierr);
4250ffd830a3SStefano Zampini       for (i=n_vertices;i<n_constraints+n_vertices;i++) {
4251ffd830a3SStefano Zampini         ierr = VecPlaceArray(pcbddc->vec1_R,marray+(i-n_vertices)*n_R);CHKERRQ(ierr);
4252ffd830a3SStefano Zampini         ierr = VecPlaceArray(pcbddc->vec2_R,work+i*n_R);CHKERRQ(ierr);
4253ffd830a3SStefano Zampini         ierr = KSPSolveTranspose(pcbddc->ksp_R,pcbddc->vec1_R,pcbddc->vec2_R);CHKERRQ(ierr);
4254ffd830a3SStefano Zampini         ierr = VecResetArray(pcbddc->vec1_R);CHKERRQ(ierr);
4255ffd830a3SStefano Zampini         ierr = VecResetArray(pcbddc->vec2_R);CHKERRQ(ierr);
425606656605SStefano Zampini       }
4257ffd830a3SStefano Zampini       ierr = MatDenseRestoreArray(B_C,&marray);CHKERRQ(ierr);
42585b782168SStefano Zampini     }
425906656605SStefano Zampini     /* coarse basis functions */
426006656605SStefano Zampini     for (i=0;i<pcbddc->local_primal_size;i++) {
426106656605SStefano Zampini       PetscScalar *y;
426206656605SStefano Zampini 
4263ffd830a3SStefano Zampini       ierr = VecPlaceArray(pcbddc->vec1_R,work+i*n_R);CHKERRQ(ierr);
426406656605SStefano Zampini       ierr = MatDenseGetArray(pcbddc->coarse_psi_B,&y);CHKERRQ(ierr);
426506656605SStefano Zampini       ierr = VecPlaceArray(pcis->vec1_B,y+n_B*i);CHKERRQ(ierr);
426606656605SStefano Zampini       ierr = VecScatterBegin(pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
426706656605SStefano Zampini       ierr = VecScatterEnd(pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
426806656605SStefano Zampini       if (i<n_vertices) {
426906656605SStefano Zampini         y[n_B*i+idx_V_B[i]] = 1.0;
427006656605SStefano Zampini       }
427106656605SStefano Zampini       ierr = MatDenseRestoreArray(pcbddc->coarse_psi_B,&y);CHKERRQ(ierr);
427206656605SStefano Zampini       ierr = VecResetArray(pcis->vec1_B);CHKERRQ(ierr);
427306656605SStefano Zampini 
427406656605SStefano Zampini       if (pcbddc->switch_static || pcbddc->dbg_flag) {
427506656605SStefano Zampini         ierr = MatDenseGetArray(pcbddc->coarse_psi_D,&y);CHKERRQ(ierr);
427606656605SStefano Zampini         ierr = VecPlaceArray(pcis->vec1_D,y+n_D*i);CHKERRQ(ierr);
427706656605SStefano Zampini         ierr = VecScatterBegin(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
427806656605SStefano Zampini         ierr = VecScatterEnd(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
427906656605SStefano Zampini         ierr = VecResetArray(pcis->vec1_D);CHKERRQ(ierr);
428006656605SStefano Zampini         ierr = MatDenseRestoreArray(pcbddc->coarse_psi_D,&y);CHKERRQ(ierr);
428106656605SStefano Zampini       }
428206656605SStefano Zampini       ierr = VecResetArray(pcbddc->vec1_R);CHKERRQ(ierr);
428306656605SStefano Zampini     }
4284ffd830a3SStefano Zampini     ierr = MatDestroy(&B_V);CHKERRQ(ierr);
4285ffd830a3SStefano Zampini     ierr = MatDestroy(&B_C);CHKERRQ(ierr);
428606656605SStefano Zampini   }
4287a6e023c1Sstefano_zampini 
4288d62866d3SStefano Zampini   /* free memory */
428988ebb749SStefano Zampini   ierr = PetscFree(idx_V_B);CHKERRQ(ierr);
429006656605SStefano Zampini   ierr = MatDestroy(&S_VV);CHKERRQ(ierr);
429106656605SStefano Zampini   ierr = MatDestroy(&S_CV);CHKERRQ(ierr);
429206656605SStefano Zampini   ierr = MatDestroy(&S_VC);CHKERRQ(ierr);
429306656605SStefano Zampini   ierr = MatDestroy(&S_CC);CHKERRQ(ierr);
4294d62866d3SStefano Zampini   ierr = PetscFree(work);CHKERRQ(ierr);
4295d62866d3SStefano Zampini   if (n_vertices) {
4296d62866d3SStefano Zampini     ierr = MatDestroy(&A_VR);CHKERRQ(ierr);
4297d62866d3SStefano Zampini   }
4298d62866d3SStefano Zampini   if (n_constraints) {
4299d62866d3SStefano Zampini     ierr = MatDestroy(&C_CR);CHKERRQ(ierr);
4300d62866d3SStefano Zampini   }
430188ebb749SStefano Zampini   /* Checking coarse_sub_mat and coarse basis functions */
430288ebb749SStefano Zampini   /* Symmetric case     : It should be \Phi^{(j)^T} A^{(j)} \Phi^{(j)}=coarse_sub_mat */
430388ebb749SStefano Zampini   /* Non-symmetric case : It should be \Psi^{(j)^T} A^{(j)} \Phi^{(j)}=coarse_sub_mat */
4304d12edf2fSStefano Zampini   if (pcbddc->dbg_flag) {
430588ebb749SStefano Zampini     Mat         coarse_sub_mat;
430625084f0cSStefano Zampini     Mat         AUXMAT,TM1,TM2,TM3,TM4;
430788ebb749SStefano Zampini     Mat         coarse_phi_D,coarse_phi_B;
430888ebb749SStefano Zampini     Mat         coarse_psi_D,coarse_psi_B;
430988ebb749SStefano Zampini     Mat         A_II,A_BB,A_IB,A_BI;
43108bec7fa6SStefano Zampini     Mat         C_B,CPHI;
43118bec7fa6SStefano Zampini     IS          is_dummy;
43128bec7fa6SStefano Zampini     Vec         mones;
431388ebb749SStefano Zampini     MatType     checkmattype=MATSEQAIJ;
431488ebb749SStefano Zampini     PetscReal   real_value;
431588ebb749SStefano Zampini 
4316a3df083aSStefano Zampini     if (pcbddc->benign_n && !pcbddc->benign_change_explicit) {
4317a3df083aSStefano Zampini       Mat A;
4318a3df083aSStefano Zampini       ierr = PCBDDCBenignProject(pc,NULL,NULL,&A);CHKERRQ(ierr);
43197dae84e0SHong Zhang       ierr = MatCreateSubMatrix(A,pcis->is_I_local,pcis->is_I_local,MAT_INITIAL_MATRIX,&A_II);CHKERRQ(ierr);
43207dae84e0SHong Zhang       ierr = MatCreateSubMatrix(A,pcis->is_I_local,pcis->is_B_local,MAT_INITIAL_MATRIX,&A_IB);CHKERRQ(ierr);
43217dae84e0SHong Zhang       ierr = MatCreateSubMatrix(A,pcis->is_B_local,pcis->is_I_local,MAT_INITIAL_MATRIX,&A_BI);CHKERRQ(ierr);
43227dae84e0SHong Zhang       ierr = MatCreateSubMatrix(A,pcis->is_B_local,pcis->is_B_local,MAT_INITIAL_MATRIX,&A_BB);CHKERRQ(ierr);
4323a3df083aSStefano Zampini       ierr = MatDestroy(&A);CHKERRQ(ierr);
4324a3df083aSStefano Zampini     } else {
432588ebb749SStefano Zampini       ierr = MatConvert(pcis->A_II,checkmattype,MAT_INITIAL_MATRIX,&A_II);CHKERRQ(ierr);
432688ebb749SStefano Zampini       ierr = MatConvert(pcis->A_IB,checkmattype,MAT_INITIAL_MATRIX,&A_IB);CHKERRQ(ierr);
432788ebb749SStefano Zampini       ierr = MatConvert(pcis->A_BI,checkmattype,MAT_INITIAL_MATRIX,&A_BI);CHKERRQ(ierr);
432888ebb749SStefano Zampini       ierr = MatConvert(pcis->A_BB,checkmattype,MAT_INITIAL_MATRIX,&A_BB);CHKERRQ(ierr);
4329a3df083aSStefano Zampini     }
433088ebb749SStefano Zampini     ierr = MatConvert(pcbddc->coarse_phi_D,checkmattype,MAT_INITIAL_MATRIX,&coarse_phi_D);CHKERRQ(ierr);
433188ebb749SStefano Zampini     ierr = MatConvert(pcbddc->coarse_phi_B,checkmattype,MAT_INITIAL_MATRIX,&coarse_phi_B);CHKERRQ(ierr);
4332ffd830a3SStefano Zampini     if (!pcbddc->symmetric_primal) {
433388ebb749SStefano Zampini       ierr = MatConvert(pcbddc->coarse_psi_D,checkmattype,MAT_INITIAL_MATRIX,&coarse_psi_D);CHKERRQ(ierr);
433488ebb749SStefano Zampini       ierr = MatConvert(pcbddc->coarse_psi_B,checkmattype,MAT_INITIAL_MATRIX,&coarse_psi_B);CHKERRQ(ierr);
433588ebb749SStefano Zampini     }
433688ebb749SStefano Zampini     ierr = MatCreateSeqDense(PETSC_COMM_SELF,pcbddc->local_primal_size,pcbddc->local_primal_size,coarse_submat_vals,&coarse_sub_mat);CHKERRQ(ierr);
433788ebb749SStefano Zampini 
433825084f0cSStefano Zampini     ierr = PetscViewerASCIIPrintf(pcbddc->dbg_viewer,"--------------------------------------------------\n");CHKERRQ(ierr);
43393301b35fSStefano Zampini     ierr = PetscViewerASCIIPrintf(pcbddc->dbg_viewer,"Check coarse sub mat computation (symmetric %d)\n",pcbddc->symmetric_primal);CHKERRQ(ierr);
434025084f0cSStefano Zampini     ierr = PetscViewerFlush(pcbddc->dbg_viewer);CHKERRQ(ierr);
4341ffd830a3SStefano Zampini     if (!pcbddc->symmetric_primal) {
434288ebb749SStefano Zampini       ierr = MatMatMult(A_II,coarse_phi_D,MAT_INITIAL_MATRIX,1.0,&AUXMAT);CHKERRQ(ierr);
434388ebb749SStefano Zampini       ierr = MatTransposeMatMult(coarse_psi_D,AUXMAT,MAT_INITIAL_MATRIX,1.0,&TM1);CHKERRQ(ierr);
434488ebb749SStefano Zampini       ierr = MatDestroy(&AUXMAT);CHKERRQ(ierr);
434588ebb749SStefano Zampini       ierr = MatMatMult(A_BB,coarse_phi_B,MAT_INITIAL_MATRIX,1.0,&AUXMAT);CHKERRQ(ierr);
434688ebb749SStefano Zampini       ierr = MatTransposeMatMult(coarse_psi_B,AUXMAT,MAT_INITIAL_MATRIX,1.0,&TM2);CHKERRQ(ierr);
434788ebb749SStefano Zampini       ierr = MatDestroy(&AUXMAT);CHKERRQ(ierr);
434888ebb749SStefano Zampini       ierr = MatMatMult(A_IB,coarse_phi_B,MAT_INITIAL_MATRIX,1.0,&AUXMAT);CHKERRQ(ierr);
434988ebb749SStefano Zampini       ierr = MatTransposeMatMult(coarse_psi_D,AUXMAT,MAT_INITIAL_MATRIX,1.0,&TM3);CHKERRQ(ierr);
435088ebb749SStefano Zampini       ierr = MatDestroy(&AUXMAT);CHKERRQ(ierr);
435188ebb749SStefano Zampini       ierr = MatMatMult(A_BI,coarse_phi_D,MAT_INITIAL_MATRIX,1.0,&AUXMAT);CHKERRQ(ierr);
435288ebb749SStefano Zampini       ierr = MatTransposeMatMult(coarse_psi_B,AUXMAT,MAT_INITIAL_MATRIX,1.0,&TM4);CHKERRQ(ierr);
435388ebb749SStefano Zampini       ierr = MatDestroy(&AUXMAT);CHKERRQ(ierr);
435488ebb749SStefano Zampini     } else {
435588ebb749SStefano Zampini       ierr = MatPtAP(A_II,coarse_phi_D,MAT_INITIAL_MATRIX,1.0,&TM1);CHKERRQ(ierr);
435688ebb749SStefano Zampini       ierr = MatPtAP(A_BB,coarse_phi_B,MAT_INITIAL_MATRIX,1.0,&TM2);CHKERRQ(ierr);
435788ebb749SStefano Zampini       ierr = MatMatMult(A_IB,coarse_phi_B,MAT_INITIAL_MATRIX,1.0,&AUXMAT);CHKERRQ(ierr);
435888ebb749SStefano Zampini       ierr = MatTransposeMatMult(coarse_phi_D,AUXMAT,MAT_INITIAL_MATRIX,1.0,&TM3);CHKERRQ(ierr);
435988ebb749SStefano Zampini       ierr = MatDestroy(&AUXMAT);CHKERRQ(ierr);
436088ebb749SStefano Zampini       ierr = MatMatMult(A_BI,coarse_phi_D,MAT_INITIAL_MATRIX,1.0,&AUXMAT);CHKERRQ(ierr);
436188ebb749SStefano Zampini       ierr = MatTransposeMatMult(coarse_phi_B,AUXMAT,MAT_INITIAL_MATRIX,1.0,&TM4);CHKERRQ(ierr);
436288ebb749SStefano Zampini       ierr = MatDestroy(&AUXMAT);CHKERRQ(ierr);
436388ebb749SStefano Zampini     }
436488ebb749SStefano Zampini     ierr = MatAXPY(TM1,one,TM2,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr);
436588ebb749SStefano Zampini     ierr = MatAXPY(TM1,one,TM3,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr);
436688ebb749SStefano Zampini     ierr = MatAXPY(TM1,one,TM4,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr);
4367511c6705SHong Zhang     ierr = MatConvert(TM1,MATSEQDENSE,MAT_INPLACE_MATRIX,&TM1);CHKERRQ(ierr);
43684f1b2e48SStefano Zampini     if (pcbddc->benign_n) {
4369fc227af8SStefano Zampini       Mat         B0_B,B0_BPHI;
4370d12edf2fSStefano Zampini       PetscScalar *data,*data2;
43714f1b2e48SStefano Zampini       PetscInt    j;
4372d12edf2fSStefano Zampini 
43734f1b2e48SStefano Zampini       ierr = ISCreateStride(PETSC_COMM_SELF,pcbddc->benign_n,0,1,&is_dummy);CHKERRQ(ierr);
43747dae84e0SHong Zhang       ierr = MatCreateSubMatrix(pcbddc->benign_B0,is_dummy,pcis->is_B_local,MAT_INITIAL_MATRIX,&B0_B);CHKERRQ(ierr);
4375d12edf2fSStefano Zampini       ierr = MatMatMult(B0_B,coarse_phi_B,MAT_INITIAL_MATRIX,1.0,&B0_BPHI);CHKERRQ(ierr);
437686c38910SStefano Zampini       ierr = MatConvert(B0_BPHI,MATSEQDENSE,MAT_INPLACE_MATRIX,&B0_BPHI);CHKERRQ(ierr);
4377d12edf2fSStefano Zampini       ierr = MatDenseGetArray(TM1,&data);CHKERRQ(ierr);
4378d12edf2fSStefano Zampini       ierr = MatDenseGetArray(B0_BPHI,&data2);CHKERRQ(ierr);
43794f1b2e48SStefano Zampini       for (j=0;j<pcbddc->benign_n;j++) {
43804f1b2e48SStefano Zampini         PetscInt primal_idx = pcbddc->local_primal_size - pcbddc->benign_n + j;
4381d12edf2fSStefano Zampini         for (i=0;i<pcbddc->local_primal_size;i++) {
43824f1b2e48SStefano Zampini           data[primal_idx*pcbddc->local_primal_size+i] += data2[i*pcbddc->benign_n+j];
43834f1b2e48SStefano Zampini           data[i*pcbddc->local_primal_size+primal_idx] += data2[i*pcbddc->benign_n+j];
43844f1b2e48SStefano Zampini         }
4385d12edf2fSStefano Zampini       }
4386d12edf2fSStefano Zampini       ierr = MatDenseRestoreArray(TM1,&data);CHKERRQ(ierr);
4387d12edf2fSStefano Zampini       ierr = MatDenseRestoreArray(B0_BPHI,&data2);CHKERRQ(ierr);
4388d12edf2fSStefano Zampini       ierr = MatDestroy(&B0_B);CHKERRQ(ierr);
4389d12edf2fSStefano Zampini       ierr = ISDestroy(&is_dummy);CHKERRQ(ierr);
4390d12edf2fSStefano Zampini       ierr = MatDestroy(&B0_BPHI);CHKERRQ(ierr);
4391d12edf2fSStefano Zampini     }
4392d12edf2fSStefano Zampini #if 0
4393d12edf2fSStefano Zampini   {
4394d12edf2fSStefano Zampini     PetscViewer viewer;
4395d12edf2fSStefano Zampini     char filename[256];
4396ffd830a3SStefano Zampini     sprintf(filename,"details_local_coarse_mat%d_level%d.m",PetscGlobalRank,pcbddc->current_level);
4397d12edf2fSStefano Zampini     ierr = PetscViewerASCIIOpen(PETSC_COMM_SELF,filename,&viewer);CHKERRQ(ierr);
4398d12edf2fSStefano Zampini     ierr = PetscViewerSetFormat(viewer,PETSC_VIEWER_ASCII_MATLAB);CHKERRQ(ierr);
4399ffd830a3SStefano Zampini     ierr = PetscObjectSetName((PetscObject)coarse_sub_mat,"computed");CHKERRQ(ierr);
4400ffd830a3SStefano Zampini     ierr = MatView(coarse_sub_mat,viewer);CHKERRQ(ierr);
4401ffd830a3SStefano Zampini     ierr = PetscObjectSetName((PetscObject)TM1,"projected");CHKERRQ(ierr);
4402d12edf2fSStefano Zampini     ierr = MatView(TM1,viewer);CHKERRQ(ierr);
440372b8c272SStefano Zampini     if (save_change) {
440472b8c272SStefano Zampini       Mat phi_B;
440572b8c272SStefano Zampini       ierr = MatMatMult(save_change,pcbddc->coarse_phi_B,MAT_INITIAL_MATRIX,1.0,&phi_B);CHKERRQ(ierr);
440672b8c272SStefano Zampini       ierr = PetscObjectSetName((PetscObject)phi_B,"phi_B");CHKERRQ(ierr);
440772b8c272SStefano Zampini       ierr = MatView(phi_B,viewer);CHKERRQ(ierr);
440872b8c272SStefano Zampini       ierr = MatDestroy(&phi_B);CHKERRQ(ierr);
440972b8c272SStefano Zampini     } else {
4410ffd830a3SStefano Zampini       ierr = PetscObjectSetName((PetscObject)pcbddc->coarse_phi_B,"phi_B");CHKERRQ(ierr);
4411ffd830a3SStefano Zampini       ierr = MatView(pcbddc->coarse_phi_B,viewer);CHKERRQ(ierr);
441272b8c272SStefano Zampini     }
4413ffd830a3SStefano Zampini     if (pcbddc->coarse_phi_D) {
4414ffd830a3SStefano Zampini       ierr = PetscObjectSetName((PetscObject)pcbddc->coarse_phi_D,"phi_D");CHKERRQ(ierr);
4415ffd830a3SStefano Zampini       ierr = MatView(pcbddc->coarse_phi_D,viewer);CHKERRQ(ierr);
4416ffd830a3SStefano Zampini     }
4417ffd830a3SStefano Zampini     if (pcbddc->coarse_psi_B) {
4418ffd830a3SStefano Zampini       ierr = PetscObjectSetName((PetscObject)pcbddc->coarse_psi_B,"psi_B");CHKERRQ(ierr);
4419ffd830a3SStefano Zampini       ierr = MatView(pcbddc->coarse_psi_B,viewer);CHKERRQ(ierr);
4420ffd830a3SStefano Zampini     }
442172b8c272SStefano Zampini     if (pcbddc->coarse_psi_D) {
4422ffd830a3SStefano Zampini       ierr = PetscObjectSetName((PetscObject)pcbddc->coarse_psi_D,"psi_D");CHKERRQ(ierr);
4423ffd830a3SStefano Zampini       ierr = MatView(pcbddc->coarse_psi_D,viewer);CHKERRQ(ierr);
4424ffd830a3SStefano Zampini     }
4425d12edf2fSStefano Zampini     ierr = PetscViewerDestroy(&viewer);CHKERRQ(ierr);
4426d12edf2fSStefano Zampini   }
4427d12edf2fSStefano Zampini #endif
442881d9aea3SBarry Smith     ierr = MatAXPY(TM1,m_one,coarse_sub_mat,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr);
44298bec7fa6SStefano Zampini     ierr = MatNorm(TM1,NORM_FROBENIUS,&real_value);CHKERRQ(ierr);
44301575c14dSBarry Smith     ierr = PetscViewerASCIIPushSynchronized(pcbddc->dbg_viewer);CHKERRQ(ierr);
443106656605SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"Subdomain %04d          matrix error % 1.14e\n",PetscGlobalRank,real_value);CHKERRQ(ierr);
44328bec7fa6SStefano Zampini 
44338bec7fa6SStefano Zampini     /* check constraints */
4434a00504b5SStefano Zampini     ierr = ISCreateStride(PETSC_COMM_SELF,pcbddc->local_primal_size-pcbddc->benign_n,0,1,&is_dummy);CHKERRQ(ierr);
44357dae84e0SHong Zhang     ierr = MatCreateSubMatrix(pcbddc->ConstraintMatrix,is_dummy,pcis->is_B_local,MAT_INITIAL_MATRIX,&C_B);CHKERRQ(ierr);
44364f1b2e48SStefano Zampini     if (!pcbddc->benign_n) { /* TODO: add benign case */
44378bec7fa6SStefano Zampini       ierr = MatMatMult(C_B,coarse_phi_B,MAT_INITIAL_MATRIX,1.0,&CPHI);CHKERRQ(ierr);
4438a00504b5SStefano Zampini     } else {
4439a00504b5SStefano Zampini       PetscScalar *data;
4440a00504b5SStefano Zampini       Mat         tmat;
4441a00504b5SStefano Zampini       ierr = MatDenseGetArray(pcbddc->coarse_phi_B,&data);CHKERRQ(ierr);
4442a00504b5SStefano Zampini       ierr = MatCreateSeqDense(PETSC_COMM_SELF,pcis->n_B,pcbddc->local_primal_size-pcbddc->benign_n,data,&tmat);CHKERRQ(ierr);
4443a00504b5SStefano Zampini       ierr = MatDenseRestoreArray(pcbddc->coarse_phi_B,&data);CHKERRQ(ierr);
4444a00504b5SStefano Zampini       ierr = MatMatMult(C_B,tmat,MAT_INITIAL_MATRIX,1.0,&CPHI);CHKERRQ(ierr);
4445a00504b5SStefano Zampini       ierr = MatDestroy(&tmat);CHKERRQ(ierr);
4446a00504b5SStefano Zampini     }
44478bec7fa6SStefano Zampini     ierr = MatCreateVecs(CPHI,&mones,NULL);CHKERRQ(ierr);
44488bec7fa6SStefano Zampini     ierr = VecSet(mones,-1.0);CHKERRQ(ierr);
44498bec7fa6SStefano Zampini     ierr = MatDiagonalSet(CPHI,mones,ADD_VALUES);CHKERRQ(ierr);
44508bec7fa6SStefano Zampini     ierr = MatNorm(CPHI,NORM_FROBENIUS,&real_value);CHKERRQ(ierr);
4451bdae7319SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"Subdomain %04d phi constraints error % 1.14e\n",PetscGlobalRank,real_value);CHKERRQ(ierr);
4452ffd830a3SStefano Zampini     if (!pcbddc->symmetric_primal) {
4453bdae7319SStefano Zampini       ierr = MatMatMult(C_B,coarse_psi_B,MAT_REUSE_MATRIX,1.0,&CPHI);CHKERRQ(ierr);
4454bdae7319SStefano Zampini       ierr = VecSet(mones,-1.0);CHKERRQ(ierr);
4455bdae7319SStefano Zampini       ierr = MatDiagonalSet(CPHI,mones,ADD_VALUES);CHKERRQ(ierr);
4456bdae7319SStefano Zampini       ierr = MatNorm(CPHI,NORM_FROBENIUS,&real_value);CHKERRQ(ierr);
4457bdae7319SStefano Zampini       ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"Subdomain %04d psi constraints error % 1.14e\n",PetscGlobalRank,real_value);CHKERRQ(ierr);
445888ebb749SStefano Zampini     }
44598bec7fa6SStefano Zampini     ierr = MatDestroy(&C_B);CHKERRQ(ierr);
44608bec7fa6SStefano Zampini     ierr = MatDestroy(&CPHI);CHKERRQ(ierr);
44618bec7fa6SStefano Zampini     ierr = ISDestroy(&is_dummy);CHKERRQ(ierr);
44628bec7fa6SStefano Zampini     ierr = VecDestroy(&mones);CHKERRQ(ierr);
446325084f0cSStefano Zampini     ierr = PetscViewerFlush(pcbddc->dbg_viewer);CHKERRQ(ierr);
446488ebb749SStefano Zampini     ierr = MatDestroy(&A_II);CHKERRQ(ierr);
446588ebb749SStefano Zampini     ierr = MatDestroy(&A_BB);CHKERRQ(ierr);
446688ebb749SStefano Zampini     ierr = MatDestroy(&A_IB);CHKERRQ(ierr);
446788ebb749SStefano Zampini     ierr = MatDestroy(&A_BI);CHKERRQ(ierr);
446888ebb749SStefano Zampini     ierr = MatDestroy(&TM1);CHKERRQ(ierr);
446988ebb749SStefano Zampini     ierr = MatDestroy(&TM2);CHKERRQ(ierr);
447088ebb749SStefano Zampini     ierr = MatDestroy(&TM3);CHKERRQ(ierr);
447188ebb749SStefano Zampini     ierr = MatDestroy(&TM4);CHKERRQ(ierr);
447288ebb749SStefano Zampini     ierr = MatDestroy(&coarse_phi_D);CHKERRQ(ierr);
447388ebb749SStefano Zampini     ierr = MatDestroy(&coarse_phi_B);CHKERRQ(ierr);
4474ffd830a3SStefano Zampini     if (!pcbddc->symmetric_primal) {
447588ebb749SStefano Zampini       ierr = MatDestroy(&coarse_psi_D);CHKERRQ(ierr);
447688ebb749SStefano Zampini       ierr = MatDestroy(&coarse_psi_B);CHKERRQ(ierr);
447788ebb749SStefano Zampini     }
447888ebb749SStefano Zampini     ierr = MatDestroy(&coarse_sub_mat);CHKERRQ(ierr);
447988ebb749SStefano Zampini   }
44808629588bSStefano Zampini   /* get back data */
44818629588bSStefano Zampini   *coarse_submat_vals_n = coarse_submat_vals;
448288ebb749SStefano Zampini   PetscFunctionReturn(0);
448388ebb749SStefano Zampini }
448488ebb749SStefano Zampini 
44857dae84e0SHong Zhang PetscErrorCode MatCreateSubMatrixUnsorted(Mat A, IS isrow, IS iscol, Mat* B)
4486aa0d41d4SStefano Zampini {
4487d65f70fdSStefano Zampini   Mat            *work_mat;
4488d65f70fdSStefano Zampini   IS             isrow_s,iscol_s;
4489d65f70fdSStefano Zampini   PetscBool      rsorted,csorted;
4490c43ebad9SStefano Zampini   PetscInt       rsize,*idxs_perm_r=NULL,csize,*idxs_perm_c=NULL;
4491aa0d41d4SStefano Zampini   PetscErrorCode ierr;
4492aa0d41d4SStefano Zampini 
4493aa0d41d4SStefano Zampini   PetscFunctionBegin;
4494d65f70fdSStefano Zampini   ierr = ISSorted(isrow,&rsorted);CHKERRQ(ierr);
4495d65f70fdSStefano Zampini   ierr = ISSorted(iscol,&csorted);CHKERRQ(ierr);
4496d65f70fdSStefano Zampini   ierr = ISGetLocalSize(isrow,&rsize);CHKERRQ(ierr);
4497d65f70fdSStefano Zampini   ierr = ISGetLocalSize(iscol,&csize);CHKERRQ(ierr);
4498aa0d41d4SStefano Zampini 
4499d65f70fdSStefano Zampini   if (!rsorted) {
4500906d46d4SStefano Zampini     const PetscInt *idxs;
4501906d46d4SStefano Zampini     PetscInt *idxs_sorted,i;
4502aa0d41d4SStefano Zampini 
4503d65f70fdSStefano Zampini     ierr = PetscMalloc1(rsize,&idxs_perm_r);CHKERRQ(ierr);
4504d65f70fdSStefano Zampini     ierr = PetscMalloc1(rsize,&idxs_sorted);CHKERRQ(ierr);
4505d65f70fdSStefano Zampini     for (i=0;i<rsize;i++) {
4506d65f70fdSStefano Zampini       idxs_perm_r[i] = i;
4507aa0d41d4SStefano Zampini     }
4508d65f70fdSStefano Zampini     ierr = ISGetIndices(isrow,&idxs);CHKERRQ(ierr);
4509d65f70fdSStefano Zampini     ierr = PetscSortIntWithPermutation(rsize,idxs,idxs_perm_r);CHKERRQ(ierr);
4510d65f70fdSStefano Zampini     for (i=0;i<rsize;i++) {
4511d65f70fdSStefano Zampini       idxs_sorted[i] = idxs[idxs_perm_r[i]];
4512aa0d41d4SStefano Zampini     }
4513d65f70fdSStefano Zampini     ierr = ISRestoreIndices(isrow,&idxs);CHKERRQ(ierr);
4514d65f70fdSStefano Zampini     ierr = ISCreateGeneral(PETSC_COMM_SELF,rsize,idxs_sorted,PETSC_OWN_POINTER,&isrow_s);CHKERRQ(ierr);
4515d65f70fdSStefano Zampini   } else {
4516d65f70fdSStefano Zampini     ierr = PetscObjectReference((PetscObject)isrow);CHKERRQ(ierr);
4517d65f70fdSStefano Zampini     isrow_s = isrow;
4518aa0d41d4SStefano Zampini   }
4519906d46d4SStefano Zampini 
4520d65f70fdSStefano Zampini   if (!csorted) {
4521d65f70fdSStefano Zampini     if (isrow == iscol) {
4522d65f70fdSStefano Zampini       ierr = PetscObjectReference((PetscObject)isrow_s);CHKERRQ(ierr);
4523d65f70fdSStefano Zampini       iscol_s = isrow_s;
4524d65f70fdSStefano Zampini     } else {
4525d65f70fdSStefano Zampini       const PetscInt *idxs;
4526d65f70fdSStefano Zampini       PetscInt       *idxs_sorted,i;
4527906d46d4SStefano Zampini 
4528d65f70fdSStefano Zampini       ierr = PetscMalloc1(csize,&idxs_perm_c);CHKERRQ(ierr);
4529d65f70fdSStefano Zampini       ierr = PetscMalloc1(csize,&idxs_sorted);CHKERRQ(ierr);
4530d65f70fdSStefano Zampini       for (i=0;i<csize;i++) {
4531d65f70fdSStefano Zampini         idxs_perm_c[i] = i;
4532d65f70fdSStefano Zampini       }
4533d65f70fdSStefano Zampini       ierr = ISGetIndices(iscol,&idxs);CHKERRQ(ierr);
4534d65f70fdSStefano Zampini       ierr = PetscSortIntWithPermutation(csize,idxs,idxs_perm_c);CHKERRQ(ierr);
4535d65f70fdSStefano Zampini       for (i=0;i<csize;i++) {
4536d65f70fdSStefano Zampini         idxs_sorted[i] = idxs[idxs_perm_c[i]];
4537d65f70fdSStefano Zampini       }
4538d65f70fdSStefano Zampini       ierr = ISRestoreIndices(iscol,&idxs);CHKERRQ(ierr);
4539d65f70fdSStefano Zampini       ierr = ISCreateGeneral(PETSC_COMM_SELF,csize,idxs_sorted,PETSC_OWN_POINTER,&iscol_s);CHKERRQ(ierr);
4540d65f70fdSStefano Zampini     }
4541d65f70fdSStefano Zampini   } else {
4542d65f70fdSStefano Zampini     ierr = PetscObjectReference((PetscObject)iscol);CHKERRQ(ierr);
4543d65f70fdSStefano Zampini     iscol_s = iscol;
4544d65f70fdSStefano Zampini   }
4545d65f70fdSStefano Zampini 
45467dae84e0SHong Zhang   ierr = MatCreateSubMatrices(A,1,&isrow_s,&iscol_s,MAT_INITIAL_MATRIX,&work_mat);CHKERRQ(ierr);
4547d65f70fdSStefano Zampini 
4548d65f70fdSStefano Zampini   if (!rsorted || !csorted) {
4549906d46d4SStefano Zampini     Mat      new_mat;
4550d65f70fdSStefano Zampini     IS       is_perm_r,is_perm_c;
4551906d46d4SStefano Zampini 
4552d65f70fdSStefano Zampini     if (!rsorted) {
4553d65f70fdSStefano Zampini       PetscInt *idxs_r,i;
4554d65f70fdSStefano Zampini       ierr = PetscMalloc1(rsize,&idxs_r);CHKERRQ(ierr);
4555d65f70fdSStefano Zampini       for (i=0;i<rsize;i++) {
4556d65f70fdSStefano Zampini         idxs_r[idxs_perm_r[i]] = i;
4557906d46d4SStefano Zampini       }
4558d65f70fdSStefano Zampini       ierr = PetscFree(idxs_perm_r);CHKERRQ(ierr);
4559d65f70fdSStefano Zampini       ierr = ISCreateGeneral(PETSC_COMM_SELF,rsize,idxs_r,PETSC_OWN_POINTER,&is_perm_r);CHKERRQ(ierr);
4560d65f70fdSStefano Zampini     } else {
4561d65f70fdSStefano Zampini       ierr = ISCreateStride(PETSC_COMM_SELF,rsize,0,1,&is_perm_r);CHKERRQ(ierr);
4562906d46d4SStefano Zampini     }
4563d65f70fdSStefano Zampini     ierr = ISSetPermutation(is_perm_r);CHKERRQ(ierr);
4564d65f70fdSStefano Zampini 
4565d65f70fdSStefano Zampini     if (!csorted) {
4566d65f70fdSStefano Zampini       if (isrow_s == iscol_s) {
4567d65f70fdSStefano Zampini         ierr = PetscObjectReference((PetscObject)is_perm_r);CHKERRQ(ierr);
4568d65f70fdSStefano Zampini         is_perm_c = is_perm_r;
4569d65f70fdSStefano Zampini       } else {
4570d65f70fdSStefano Zampini         PetscInt *idxs_c,i;
4571f913dca9SStefano Zampini         if (!idxs_perm_c) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Permutation array not present");
4572d65f70fdSStefano Zampini         ierr = PetscMalloc1(csize,&idxs_c);CHKERRQ(ierr);
4573d65f70fdSStefano Zampini         for (i=0;i<csize;i++) {
4574d65f70fdSStefano Zampini           idxs_c[idxs_perm_c[i]] = i;
4575d65f70fdSStefano Zampini         }
4576d65f70fdSStefano Zampini         ierr = PetscFree(idxs_perm_c);CHKERRQ(ierr);
4577d65f70fdSStefano Zampini         ierr = ISCreateGeneral(PETSC_COMM_SELF,csize,idxs_c,PETSC_OWN_POINTER,&is_perm_c);CHKERRQ(ierr);
4578d65f70fdSStefano Zampini       }
4579d65f70fdSStefano Zampini     } else {
4580d65f70fdSStefano Zampini       ierr = ISCreateStride(PETSC_COMM_SELF,csize,0,1,&is_perm_c);CHKERRQ(ierr);
4581d65f70fdSStefano Zampini     }
4582d65f70fdSStefano Zampini     ierr = ISSetPermutation(is_perm_c);CHKERRQ(ierr);
4583d65f70fdSStefano Zampini 
4584d65f70fdSStefano Zampini     ierr = MatPermute(work_mat[0],is_perm_r,is_perm_c,&new_mat);CHKERRQ(ierr);
4585d65f70fdSStefano Zampini     ierr = MatDestroy(&work_mat[0]);CHKERRQ(ierr);
4586d65f70fdSStefano Zampini     work_mat[0] = new_mat;
4587d65f70fdSStefano Zampini     ierr = ISDestroy(&is_perm_r);CHKERRQ(ierr);
4588d65f70fdSStefano Zampini     ierr = ISDestroy(&is_perm_c);CHKERRQ(ierr);
4589d65f70fdSStefano Zampini   }
4590d65f70fdSStefano Zampini 
4591d65f70fdSStefano Zampini   ierr = PetscObjectReference((PetscObject)work_mat[0]);CHKERRQ(ierr);
4592d65f70fdSStefano Zampini   *B = work_mat[0];
4593d65f70fdSStefano Zampini   ierr = MatDestroyMatrices(1,&work_mat);CHKERRQ(ierr);
4594d65f70fdSStefano Zampini   ierr = ISDestroy(&isrow_s);CHKERRQ(ierr);
4595d65f70fdSStefano Zampini   ierr = ISDestroy(&iscol_s);CHKERRQ(ierr);
4596d65f70fdSStefano Zampini   PetscFunctionReturn(0);
4597d65f70fdSStefano Zampini }
4598d65f70fdSStefano Zampini 
45995e8657edSStefano Zampini PetscErrorCode PCBDDCComputeLocalMatrix(PC pc, Mat ChangeOfBasisMatrix)
4600aa0d41d4SStefano Zampini {
4601aa0d41d4SStefano Zampini   Mat_IS*        matis = (Mat_IS*)pc->pmat->data;
46025e8657edSStefano Zampini   PC_BDDC*       pcbddc = (PC_BDDC*)pc->data;
4603022d8d2bSstefano_zampini   Mat            new_mat,lA;
46045e8657edSStefano Zampini   IS             is_local,is_global;
4605d65f70fdSStefano Zampini   PetscInt       local_size;
4606d65f70fdSStefano Zampini   PetscBool      isseqaij;
4607aa0d41d4SStefano Zampini   PetscErrorCode ierr;
4608aa0d41d4SStefano Zampini 
4609aa0d41d4SStefano Zampini   PetscFunctionBegin;
4610aa0d41d4SStefano Zampini   ierr = MatDestroy(&pcbddc->local_mat);CHKERRQ(ierr);
46115e8657edSStefano Zampini   ierr = MatGetSize(matis->A,&local_size,NULL);CHKERRQ(ierr);
46125e8657edSStefano Zampini   ierr = ISCreateStride(PetscObjectComm((PetscObject)matis->A),local_size,0,1,&is_local);CHKERRQ(ierr);
4613b087196eSStefano Zampini   ierr = ISLocalToGlobalMappingApplyIS(pc->pmat->rmap->mapping,is_local,&is_global);CHKERRQ(ierr);
4614aa0d41d4SStefano Zampini   ierr = ISDestroy(&is_local);CHKERRQ(ierr);
46157dae84e0SHong Zhang   ierr = MatCreateSubMatrixUnsorted(ChangeOfBasisMatrix,is_global,is_global,&new_mat);CHKERRQ(ierr);
4616aa0d41d4SStefano Zampini   ierr = ISDestroy(&is_global);CHKERRQ(ierr);
4617906d46d4SStefano Zampini 
4618906d46d4SStefano Zampini   /* check */
4619906d46d4SStefano Zampini   if (pcbddc->dbg_flag) {
4620906d46d4SStefano Zampini     Vec       x,x_change;
4621906d46d4SStefano Zampini     PetscReal error;
4622906d46d4SStefano Zampini 
46235e8657edSStefano Zampini     ierr = MatCreateVecs(ChangeOfBasisMatrix,&x,&x_change);CHKERRQ(ierr);
4624906d46d4SStefano Zampini     ierr = VecSetRandom(x,NULL);CHKERRQ(ierr);
46255e8657edSStefano Zampini     ierr = MatMult(ChangeOfBasisMatrix,x,x_change);CHKERRQ(ierr);
4626e176bc59SStefano Zampini     ierr = VecScatterBegin(matis->cctx,x,matis->x,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
4627e176bc59SStefano Zampini     ierr = VecScatterEnd(matis->cctx,x,matis->x,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
4628d65f70fdSStefano Zampini     ierr = MatMult(new_mat,matis->x,matis->y);CHKERRQ(ierr);
462988428137SStefano Zampini     if (!pcbddc->change_interior) {
463088428137SStefano Zampini       const PetscScalar *x,*y,*v;
463188428137SStefano Zampini       PetscReal         lerror = 0.;
463288428137SStefano Zampini       PetscInt          i;
463388428137SStefano Zampini 
463488428137SStefano Zampini       ierr = VecGetArrayRead(matis->x,&x);CHKERRQ(ierr);
463588428137SStefano Zampini       ierr = VecGetArrayRead(matis->y,&y);CHKERRQ(ierr);
463688428137SStefano Zampini       ierr = VecGetArrayRead(matis->counter,&v);CHKERRQ(ierr);
463788428137SStefano Zampini       for (i=0;i<local_size;i++)
463888428137SStefano Zampini         if (PetscRealPart(v[i]) < 1.5 && PetscAbsScalar(x[i]-y[i]) > lerror)
463988428137SStefano Zampini           lerror = PetscAbsScalar(x[i]-y[i]);
464088428137SStefano Zampini       ierr = VecRestoreArrayRead(matis->x,&x);CHKERRQ(ierr);
464188428137SStefano Zampini       ierr = VecRestoreArrayRead(matis->y,&y);CHKERRQ(ierr);
464288428137SStefano Zampini       ierr = VecRestoreArrayRead(matis->counter,&v);CHKERRQ(ierr);
464388428137SStefano Zampini       ierr = MPIU_Allreduce(&lerror,&error,1,MPIU_REAL,MPI_MAX,PetscObjectComm((PetscObject)pc));CHKERRQ(ierr);
4644637e8532SStefano Zampini       if (error > PETSC_SMALL) {
4645637e8532SStefano Zampini         if (!pcbddc->user_ChangeOfBasisMatrix || pcbddc->current_level) {
4646637e8532SStefano Zampini           SETERRQ1(PetscObjectComm((PetscObject)pc),PETSC_ERR_PLIB,"Error global vs local change on I: %1.6e\n",error);
4647637e8532SStefano Zampini         } else {
4648637e8532SStefano Zampini           SETERRQ1(PetscObjectComm((PetscObject)pc),PETSC_ERR_USER,"Error global vs local change on I: %1.6e\n",error);
4649637e8532SStefano Zampini         }
4650637e8532SStefano Zampini       }
465188428137SStefano Zampini     }
4652e176bc59SStefano Zampini     ierr = VecScatterBegin(matis->rctx,matis->y,x,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
4653e176bc59SStefano Zampini     ierr = VecScatterEnd(matis->rctx,matis->y,x,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
4654906d46d4SStefano Zampini     ierr = VecAXPY(x,-1.0,x_change);CHKERRQ(ierr);
4655906d46d4SStefano Zampini     ierr = VecNorm(x,NORM_INFINITY,&error);CHKERRQ(ierr);
4656637e8532SStefano Zampini     if (error > PETSC_SMALL) {
4657637e8532SStefano Zampini       if (!pcbddc->user_ChangeOfBasisMatrix || pcbddc->current_level) {
4658637e8532SStefano Zampini         SETERRQ1(PetscObjectComm((PetscObject)pc),PETSC_ERR_PLIB,"Error global vs local change on N: %1.6e\n",error);
4659637e8532SStefano Zampini       } else {
4660637e8532SStefano Zampini         SETERRQ1(PetscObjectComm((PetscObject)pc),PETSC_ERR_USER,"Error global vs local change on N: %1.6e\n",error);
4661637e8532SStefano Zampini       }
4662637e8532SStefano Zampini     }
4663906d46d4SStefano Zampini     ierr = VecDestroy(&x);CHKERRQ(ierr);
4664906d46d4SStefano Zampini     ierr = VecDestroy(&x_change);CHKERRQ(ierr);
4665906d46d4SStefano Zampini   }
4666906d46d4SStefano Zampini 
4667022d8d2bSstefano_zampini   /* lA is present if we are setting up an inner BDDC for a saddle point FETI-DP */
4668022d8d2bSstefano_zampini   ierr = PetscObjectQuery((PetscObject)pc,"__KSPFETIDP_lA" ,(PetscObject*)&lA);CHKERRQ(ierr);
4669022d8d2bSstefano_zampini 
467022d5777bSStefano Zampini   /* TODO: HOW TO WORK WITH BAIJ and SBAIJ and SEQDENSE? */
46719b28b3ffSStefano Zampini   ierr = PetscObjectTypeCompare((PetscObject)matis->A,MATSEQAIJ,&isseqaij);CHKERRQ(ierr);
467222d5777bSStefano Zampini   if (isseqaij) {
4673a00504b5SStefano Zampini     ierr = MatDestroy(&pcbddc->local_mat);CHKERRQ(ierr);
4674a00504b5SStefano Zampini     ierr = MatPtAP(matis->A,new_mat,MAT_INITIAL_MATRIX,2.0,&pcbddc->local_mat);CHKERRQ(ierr);
4675022d8d2bSstefano_zampini     if (lA) {
4676022d8d2bSstefano_zampini       Mat work;
4677022d8d2bSstefano_zampini       ierr = MatPtAP(lA,new_mat,MAT_INITIAL_MATRIX,2.0,&work);CHKERRQ(ierr);
4678022d8d2bSstefano_zampini       ierr = PetscObjectCompose((PetscObject)pc,"__KSPFETIDP_lA" ,(PetscObject)work);CHKERRQ(ierr);
4679022d8d2bSstefano_zampini       ierr = MatDestroy(&work);CHKERRQ(ierr);
4680022d8d2bSstefano_zampini     }
4681aa0d41d4SStefano Zampini   } else {
4682a00504b5SStefano Zampini     Mat work_mat;
46831cf9b237SStefano Zampini 
4684a00504b5SStefano Zampini     ierr = MatDestroy(&pcbddc->local_mat);CHKERRQ(ierr);
4685aa0d41d4SStefano Zampini     ierr = MatConvert(matis->A,MATSEQAIJ,MAT_INITIAL_MATRIX,&work_mat);CHKERRQ(ierr);
4686a00504b5SStefano Zampini     ierr = MatPtAP(work_mat,new_mat,MAT_INITIAL_MATRIX,2.0,&pcbddc->local_mat);CHKERRQ(ierr);
46871d82a3b6SStefano Zampini     ierr = MatDestroy(&work_mat);CHKERRQ(ierr);
4688022d8d2bSstefano_zampini     if (lA) {
4689022d8d2bSstefano_zampini       Mat work;
4690022d8d2bSstefano_zampini       ierr = MatConvert(lA,MATSEQAIJ,MAT_INITIAL_MATRIX,&work_mat);CHKERRQ(ierr);
4691022d8d2bSstefano_zampini       ierr = MatPtAP(work_mat,new_mat,MAT_INITIAL_MATRIX,2.0,&work);CHKERRQ(ierr);
4692022d8d2bSstefano_zampini       ierr = PetscObjectCompose((PetscObject)pc,"__KSPFETIDP_lA" ,(PetscObject)work);CHKERRQ(ierr);
4693022d8d2bSstefano_zampini       ierr = MatDestroy(&work);CHKERRQ(ierr);
4694022d8d2bSstefano_zampini     }
4695aa0d41d4SStefano Zampini   }
46963301b35fSStefano Zampini   if (matis->A->symmetric_set) {
46973301b35fSStefano Zampini     ierr = MatSetOption(pcbddc->local_mat,MAT_SYMMETRIC,matis->A->symmetric);CHKERRQ(ierr);
4698e496cd5dSStefano Zampini #if !defined(PETSC_USE_COMPLEX)
46993301b35fSStefano Zampini     ierr = MatSetOption(pcbddc->local_mat,MAT_HERMITIAN,matis->A->symmetric);CHKERRQ(ierr);
4700e496cd5dSStefano Zampini #endif
47013301b35fSStefano Zampini   }
4702d65f70fdSStefano Zampini   ierr = MatDestroy(&new_mat);CHKERRQ(ierr);
4703aa0d41d4SStefano Zampini   PetscFunctionReturn(0);
4704aa0d41d4SStefano Zampini }
4705aa0d41d4SStefano Zampini 
47068ce42a96SStefano Zampini PetscErrorCode PCBDDCSetUpLocalScatters(PC pc)
4707a64d13efSStefano Zampini {
4708a64d13efSStefano Zampini   PC_IS*          pcis = (PC_IS*)(pc->data);
4709a64d13efSStefano Zampini   PC_BDDC*        pcbddc = (PC_BDDC*)pc->data;
4710d62866d3SStefano Zampini   PCBDDCSubSchurs sub_schurs = pcbddc->sub_schurs;
471153892102SStefano Zampini   PetscInt        *idx_R_local=NULL;
47123a50541eSStefano Zampini   PetscInt        n_vertices,i,j,n_R,n_D,n_B;
47133a50541eSStefano Zampini   PetscInt        vbs,bs;
47146816873aSStefano Zampini   PetscBT         bitmask=NULL;
4715a64d13efSStefano Zampini   PetscErrorCode  ierr;
4716a64d13efSStefano Zampini 
4717a64d13efSStefano Zampini   PetscFunctionBegin;
4718b23d619eSStefano Zampini   /*
4719b23d619eSStefano Zampini     No need to setup local scatters if
4720b23d619eSStefano Zampini       - primal space is unchanged
4721b23d619eSStefano Zampini         AND
4722b23d619eSStefano Zampini       - we actually have locally some primal dofs (could not be true in multilevel or for isolated subdomains)
4723b23d619eSStefano Zampini         AND
4724b23d619eSStefano Zampini       - we are not in debugging mode (this is needed since there are Synchronized prints at the end of the subroutine
4725b23d619eSStefano Zampini   */
4726b23d619eSStefano Zampini   if (!pcbddc->new_primal_space_local && pcbddc->local_primal_size && !pcbddc->dbg_flag) {
4727f4ddd8eeSStefano Zampini     PetscFunctionReturn(0);
4728f4ddd8eeSStefano Zampini   }
4729f4ddd8eeSStefano Zampini   /* destroy old objects */
4730f4ddd8eeSStefano Zampini   ierr = ISDestroy(&pcbddc->is_R_local);CHKERRQ(ierr);
4731f4ddd8eeSStefano Zampini   ierr = VecScatterDestroy(&pcbddc->R_to_B);CHKERRQ(ierr);
4732f4ddd8eeSStefano Zampini   ierr = VecScatterDestroy(&pcbddc->R_to_D);CHKERRQ(ierr);
4733a64d13efSStefano Zampini   /* Set Non-overlapping dimensions */
4734b371cd4fSStefano Zampini   n_B = pcis->n_B;
4735b371cd4fSStefano Zampini   n_D = pcis->n - n_B;
4736b371cd4fSStefano Zampini   n_vertices = pcbddc->n_vertices;
47373a50541eSStefano Zampini 
4738a64d13efSStefano Zampini   /* Dohrmann's notation: dofs splitted in R (Remaining: all dofs but the vertices) and V (Vertices) */
47396816873aSStefano Zampini 
474053892102SStefano Zampini   /* create auxiliary bitmask and allocate workspace */
4741b334f244SStefano Zampini   if (!sub_schurs || !sub_schurs->reuse_solver) {
4742854ce69bSBarry Smith     ierr = PetscMalloc1(pcis->n-n_vertices,&idx_R_local);CHKERRQ(ierr);
4743a64d13efSStefano Zampini     ierr = PetscBTCreate(pcis->n,&bitmask);CHKERRQ(ierr);
4744a64d13efSStefano Zampini     for (i=0;i<n_vertices;i++) {
47450e6343abSStefano Zampini       ierr = PetscBTSet(bitmask,pcbddc->local_primal_ref_node[i]);CHKERRQ(ierr);
4746a64d13efSStefano Zampini     }
4747a64d13efSStefano Zampini 
4748a64d13efSStefano Zampini     for (i=0, n_R=0; i<pcis->n; i++) {
47494641a718SStefano Zampini       if (!PetscBTLookup(bitmask,i)) {
47506816873aSStefano Zampini         idx_R_local[n_R++] = i;
4751a64d13efSStefano Zampini       }
4752a64d13efSStefano Zampini     }
4753df4d28bfSStefano Zampini   } else { /* A different ordering (already computed) is present if we are reusing the Schur solver */
4754df4d28bfSStefano Zampini     PCBDDCReuseSolvers reuse_solver = sub_schurs->reuse_solver;
47556816873aSStefano Zampini 
4756df4d28bfSStefano Zampini     ierr = ISGetIndices(reuse_solver->is_R,(const PetscInt**)&idx_R_local);CHKERRQ(ierr);
4757df4d28bfSStefano Zampini     ierr = ISGetLocalSize(reuse_solver->is_R,&n_R);CHKERRQ(ierr);
47586816873aSStefano Zampini   }
47593a50541eSStefano Zampini 
47603a50541eSStefano Zampini   /* Block code */
47613a50541eSStefano Zampini   vbs = 1;
47623a50541eSStefano Zampini   ierr = MatGetBlockSize(pcbddc->local_mat,&bs);CHKERRQ(ierr);
47633a50541eSStefano Zampini   if (bs>1 && !(n_vertices%bs)) {
47643a50541eSStefano Zampini     PetscBool is_blocked = PETSC_TRUE;
47653a50541eSStefano Zampini     PetscInt  *vary;
4766b334f244SStefano Zampini     if (!sub_schurs || !sub_schurs->reuse_solver) {
4767785e854fSJed Brown       ierr = PetscMalloc1(pcis->n/bs,&vary);CHKERRQ(ierr);
47683a50541eSStefano Zampini       ierr = PetscMemzero(vary,pcis->n/bs*sizeof(PetscInt));CHKERRQ(ierr);
4769d3df7717SStefano Zampini       /* Verify that the vertex indices correspond to each element in a block (code taken from sbaij2.c) */
4770d3df7717SStefano Zampini       /* it is ok to check this way since local_primal_ref_node are always sorted by local numbering and idx_R_local is obtained as a complement */
47710e6343abSStefano Zampini       for (i=0; i<n_vertices; i++) vary[pcbddc->local_primal_ref_node[i]/bs]++;
4772d3df7717SStefano Zampini       for (i=0; i<pcis->n/bs; i++) {
47733a50541eSStefano Zampini         if (vary[i]!=0 && vary[i]!=bs) {
47743a50541eSStefano Zampini           is_blocked = PETSC_FALSE;
47753a50541eSStefano Zampini           break;
47763a50541eSStefano Zampini         }
47773a50541eSStefano Zampini       }
4778d3df7717SStefano Zampini       ierr = PetscFree(vary);CHKERRQ(ierr);
4779d3df7717SStefano Zampini     } else {
4780d3df7717SStefano Zampini       /* Verify directly the R set */
4781d3df7717SStefano Zampini       for (i=0; i<n_R/bs; i++) {
4782d3df7717SStefano Zampini         PetscInt j,node=idx_R_local[bs*i];
4783d3df7717SStefano Zampini         for (j=1; j<bs; j++) {
4784d3df7717SStefano Zampini           if (node != idx_R_local[bs*i+j]-j) {
4785d3df7717SStefano Zampini             is_blocked = PETSC_FALSE;
4786d3df7717SStefano Zampini             break;
4787d3df7717SStefano Zampini           }
4788d3df7717SStefano Zampini         }
4789d3df7717SStefano Zampini       }
4790d3df7717SStefano Zampini     }
47913a50541eSStefano Zampini     if (is_blocked) { /* build compressed IS for R nodes (complement of vertices) */
47923a50541eSStefano Zampini       vbs = bs;
47933a50541eSStefano Zampini       for (i=0;i<n_R/vbs;i++) {
47943a50541eSStefano Zampini         idx_R_local[i] = idx_R_local[vbs*i]/vbs;
47953a50541eSStefano Zampini       }
47963a50541eSStefano Zampini     }
47973a50541eSStefano Zampini   }
47983a50541eSStefano Zampini   ierr = ISCreateBlock(PETSC_COMM_SELF,vbs,n_R/vbs,idx_R_local,PETSC_COPY_VALUES,&pcbddc->is_R_local);CHKERRQ(ierr);
4799b334f244SStefano Zampini   if (sub_schurs && sub_schurs->reuse_solver) {
4800df4d28bfSStefano Zampini     PCBDDCReuseSolvers reuse_solver = sub_schurs->reuse_solver;
480153892102SStefano Zampini 
4802df4d28bfSStefano Zampini     ierr = ISRestoreIndices(reuse_solver->is_R,(const PetscInt**)&idx_R_local);CHKERRQ(ierr);
4803df4d28bfSStefano Zampini     ierr = ISDestroy(&reuse_solver->is_R);CHKERRQ(ierr);
480453892102SStefano Zampini     ierr = PetscObjectReference((PetscObject)pcbddc->is_R_local);CHKERRQ(ierr);
4805df4d28bfSStefano Zampini     reuse_solver->is_R = pcbddc->is_R_local;
480653892102SStefano Zampini   } else {
48073a50541eSStefano Zampini     ierr = PetscFree(idx_R_local);CHKERRQ(ierr);
480853892102SStefano Zampini   }
4809a64d13efSStefano Zampini 
4810a64d13efSStefano Zampini   /* print some info if requested */
4811a64d13efSStefano Zampini   if (pcbddc->dbg_flag) {
4812a64d13efSStefano Zampini     ierr = PetscViewerASCIIPrintf(pcbddc->dbg_viewer,"--------------------------------------------------\n");CHKERRQ(ierr);
4813a64d13efSStefano Zampini     ierr = PetscViewerFlush(pcbddc->dbg_viewer);CHKERRQ(ierr);
48141575c14dSBarry Smith     ierr = PetscViewerASCIIPushSynchronized(pcbddc->dbg_viewer);CHKERRQ(ierr);
4815a64d13efSStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"Subdomain %04d local dimensions\n",PetscGlobalRank);CHKERRQ(ierr);
4816a64d13efSStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"local_size = %d, dirichlet_size = %d, boundary_size = %d\n",pcis->n,n_D,n_B);CHKERRQ(ierr);
48174f1b2e48SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"r_size = %d, v_size = %d, constraints = %d, local_primal_size = %d\n",n_R,n_vertices,pcbddc->local_primal_size-n_vertices-pcbddc->benign_n,pcbddc->local_primal_size);CHKERRQ(ierr);
4818a64d13efSStefano Zampini     ierr = PetscViewerFlush(pcbddc->dbg_viewer);CHKERRQ(ierr);
4819a64d13efSStefano Zampini   }
4820a64d13efSStefano Zampini 
4821a64d13efSStefano Zampini   /* VecScatters pcbddc->R_to_B and (optionally) pcbddc->R_to_D */
4822b334f244SStefano Zampini   if (!sub_schurs || !sub_schurs->reuse_solver) {
48236816873aSStefano Zampini     IS       is_aux1,is_aux2;
48246816873aSStefano Zampini     PetscInt *aux_array1,*aux_array2,*is_indices,*idx_R_local;
48256816873aSStefano Zampini 
48263a50541eSStefano Zampini     ierr = ISGetIndices(pcbddc->is_R_local,(const PetscInt**)&idx_R_local);CHKERRQ(ierr);
4827854ce69bSBarry Smith     ierr = PetscMalloc1(pcis->n_B-n_vertices,&aux_array1);CHKERRQ(ierr);
4828854ce69bSBarry Smith     ierr = PetscMalloc1(pcis->n_B-n_vertices,&aux_array2);CHKERRQ(ierr);
4829a64d13efSStefano Zampini     ierr = ISGetIndices(pcis->is_I_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
48304641a718SStefano Zampini     for (i=0; i<n_D; i++) {
48314641a718SStefano Zampini       ierr = PetscBTSet(bitmask,is_indices[i]);CHKERRQ(ierr);
48324641a718SStefano Zampini     }
4833a64d13efSStefano Zampini     ierr = ISRestoreIndices(pcis->is_I_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
4834a64d13efSStefano Zampini     for (i=0, j=0; i<n_R; i++) {
48354641a718SStefano Zampini       if (!PetscBTLookup(bitmask,idx_R_local[i])) {
48364641a718SStefano Zampini         aux_array1[j++] = i;
4837a64d13efSStefano Zampini       }
4838a64d13efSStefano Zampini     }
4839a64d13efSStefano Zampini     ierr = ISCreateGeneral(PETSC_COMM_SELF,j,aux_array1,PETSC_OWN_POINTER,&is_aux1);CHKERRQ(ierr);
4840a64d13efSStefano Zampini     ierr = ISGetIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
4841a64d13efSStefano Zampini     for (i=0, j=0; i<n_B; i++) {
48424641a718SStefano Zampini       if (!PetscBTLookup(bitmask,is_indices[i])) {
48434641a718SStefano Zampini         aux_array2[j++] = i;
4844a64d13efSStefano Zampini       }
4845a64d13efSStefano Zampini     }
4846a64d13efSStefano Zampini     ierr = ISRestoreIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
4847a64d13efSStefano Zampini     ierr = ISCreateGeneral(PETSC_COMM_SELF,j,aux_array2,PETSC_OWN_POINTER,&is_aux2);CHKERRQ(ierr);
4848a64d13efSStefano Zampini     ierr = VecScatterCreate(pcbddc->vec1_R,is_aux1,pcis->vec1_B,is_aux2,&pcbddc->R_to_B);CHKERRQ(ierr);
4849a64d13efSStefano Zampini     ierr = ISDestroy(&is_aux1);CHKERRQ(ierr);
4850a64d13efSStefano Zampini     ierr = ISDestroy(&is_aux2);CHKERRQ(ierr);
4851a64d13efSStefano Zampini 
48528eeda7d8SStefano Zampini     if (pcbddc->switch_static || pcbddc->dbg_flag) {
4853785e854fSJed Brown       ierr = PetscMalloc1(n_D,&aux_array1);CHKERRQ(ierr);
4854a64d13efSStefano Zampini       for (i=0, j=0; i<n_R; i++) {
48554641a718SStefano Zampini         if (PetscBTLookup(bitmask,idx_R_local[i])) {
48564641a718SStefano Zampini           aux_array1[j++] = i;
4857a64d13efSStefano Zampini         }
4858a64d13efSStefano Zampini       }
4859a64d13efSStefano Zampini       ierr = ISCreateGeneral(PETSC_COMM_SELF,j,aux_array1,PETSC_OWN_POINTER,&is_aux1);CHKERRQ(ierr);
4860a64d13efSStefano Zampini       ierr = VecScatterCreate(pcbddc->vec1_R,is_aux1,pcis->vec1_D,(IS)0,&pcbddc->R_to_D);CHKERRQ(ierr);
4861a64d13efSStefano Zampini       ierr = ISDestroy(&is_aux1);CHKERRQ(ierr);
4862a64d13efSStefano Zampini     }
48634641a718SStefano Zampini     ierr = PetscBTDestroy(&bitmask);CHKERRQ(ierr);
48643a50541eSStefano Zampini     ierr = ISRestoreIndices(pcbddc->is_R_local,(const PetscInt**)&idx_R_local);CHKERRQ(ierr);
4865d62866d3SStefano Zampini   } else {
4866df4d28bfSStefano Zampini     PCBDDCReuseSolvers reuse_solver = sub_schurs->reuse_solver;
48676816873aSStefano Zampini     IS                 tis;
48686816873aSStefano Zampini     PetscInt           schur_size;
48696816873aSStefano Zampini 
4870df4d28bfSStefano Zampini     ierr = ISGetLocalSize(reuse_solver->is_B,&schur_size);CHKERRQ(ierr);
48716816873aSStefano Zampini     ierr = ISCreateStride(PETSC_COMM_SELF,schur_size,n_D,1,&tis);CHKERRQ(ierr);
4872df4d28bfSStefano Zampini     ierr = VecScatterCreate(pcbddc->vec1_R,tis,pcis->vec1_B,reuse_solver->is_B,&pcbddc->R_to_B);CHKERRQ(ierr);
48736816873aSStefano Zampini     ierr = ISDestroy(&tis);CHKERRQ(ierr);
48746816873aSStefano Zampini     if (pcbddc->switch_static || pcbddc->dbg_flag) {
48756816873aSStefano Zampini       ierr = ISCreateStride(PETSC_COMM_SELF,n_D,0,1,&tis);CHKERRQ(ierr);
48766816873aSStefano Zampini       ierr = VecScatterCreate(pcbddc->vec1_R,tis,pcis->vec1_D,(IS)0,&pcbddc->R_to_D);CHKERRQ(ierr);
48776816873aSStefano Zampini       ierr = ISDestroy(&tis);CHKERRQ(ierr);
4878d62866d3SStefano Zampini     }
4879d62866d3SStefano Zampini   }
4880a64d13efSStefano Zampini   PetscFunctionReturn(0);
4881a64d13efSStefano Zampini }
4882a64d13efSStefano Zampini 
4883304d26faSStefano Zampini 
4884684f6988SStefano Zampini PetscErrorCode PCBDDCSetUpLocalSolvers(PC pc, PetscBool dirichlet, PetscBool neumann)
4885304d26faSStefano Zampini {
4886304d26faSStefano Zampini   PC_BDDC        *pcbddc = (PC_BDDC*)pc->data;
4887304d26faSStefano Zampini   PC_IS          *pcis = (PC_IS*)pc->data;
4888304d26faSStefano Zampini   PC             pc_temp;
4889304d26faSStefano Zampini   Mat            A_RR;
4890f4ddd8eeSStefano Zampini   MatReuse       reuse;
4891304d26faSStefano Zampini   PetscScalar    m_one = -1.0;
4892304d26faSStefano Zampini   PetscReal      value;
489304708bb6SStefano Zampini   PetscInt       n_D,n_R;
489435529e7bSStefano Zampini   PetscBool      check_corr,issbaij;
4895304d26faSStefano Zampini   PetscErrorCode ierr;
4896e604994aSStefano Zampini   /* prefixes stuff */
4897312be037SStefano Zampini   char           dir_prefix[256],neu_prefix[256],str_level[16];
4898e604994aSStefano Zampini   size_t         len;
4899304d26faSStefano Zampini 
4900304d26faSStefano Zampini   PetscFunctionBegin;
4901304d26faSStefano Zampini 
4902e604994aSStefano Zampini   /* compute prefixes */
4903e604994aSStefano Zampini   ierr = PetscStrcpy(dir_prefix,"");CHKERRQ(ierr);
4904e604994aSStefano Zampini   ierr = PetscStrcpy(neu_prefix,"");CHKERRQ(ierr);
4905e604994aSStefano Zampini   if (!pcbddc->current_level) {
4906e604994aSStefano Zampini     ierr = PetscStrcpy(dir_prefix,((PetscObject)pc)->prefix);CHKERRQ(ierr);
4907e604994aSStefano Zampini     ierr = PetscStrcpy(neu_prefix,((PetscObject)pc)->prefix);CHKERRQ(ierr);
4908e604994aSStefano Zampini     ierr = PetscStrcat(dir_prefix,"pc_bddc_dirichlet_");CHKERRQ(ierr);
4909e604994aSStefano Zampini     ierr = PetscStrcat(neu_prefix,"pc_bddc_neumann_");CHKERRQ(ierr);
4910e604994aSStefano Zampini   } else {
491135529e7bSStefano Zampini     ierr = PetscSNPrintf(str_level,sizeof(str_level),"l%d_",(int)(pcbddc->current_level));CHKERRQ(ierr);
4912e604994aSStefano Zampini     ierr = PetscStrlen(((PetscObject)pc)->prefix,&len);CHKERRQ(ierr);
4913e604994aSStefano Zampini     len -= 15; /* remove "pc_bddc_coarse_" */
4914312be037SStefano Zampini     if (pcbddc->current_level>1) len -= 3; /* remove "lX_" with X level number */
4915312be037SStefano Zampini     if (pcbddc->current_level>10) len -= 1; /* remove another char from level number */
491634d6797cSStefano Zampini     ierr = PetscStrncpy(dir_prefix,((PetscObject)pc)->prefix,len+1);CHKERRQ(ierr);
491734d6797cSStefano Zampini     ierr = PetscStrncpy(neu_prefix,((PetscObject)pc)->prefix,len+1);CHKERRQ(ierr);
4918e604994aSStefano Zampini     ierr = PetscStrcat(dir_prefix,"pc_bddc_dirichlet_");CHKERRQ(ierr);
4919e604994aSStefano Zampini     ierr = PetscStrcat(neu_prefix,"pc_bddc_neumann_");CHKERRQ(ierr);
4920e604994aSStefano Zampini     ierr = PetscStrcat(dir_prefix,str_level);CHKERRQ(ierr);
4921e604994aSStefano Zampini     ierr = PetscStrcat(neu_prefix,str_level);CHKERRQ(ierr);
4922e604994aSStefano Zampini   }
4923e604994aSStefano Zampini 
4924304d26faSStefano Zampini   /* DIRICHLET PROBLEM */
4925684f6988SStefano Zampini   if (dirichlet) {
4926d5574798SStefano Zampini     PCBDDCSubSchurs sub_schurs = pcbddc->sub_schurs;
4927450f8f5eSStefano Zampini     if (pcbddc->benign_n && !pcbddc->benign_change_explicit) {
49289a962809SStefano Zampini       if (!sub_schurs || !sub_schurs->reuse_solver) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"Not yet implemented\n");
4929450f8f5eSStefano Zampini       if (pcbddc->dbg_flag) {
4930a3df083aSStefano Zampini         Mat    A_IIn;
4931a3df083aSStefano Zampini 
4932a3df083aSStefano Zampini         ierr = PCBDDCBenignProject(pc,pcis->is_I_local,pcis->is_I_local,&A_IIn);CHKERRQ(ierr);
4933a3df083aSStefano Zampini         ierr = MatDestroy(&pcis->A_II);CHKERRQ(ierr);
4934a3df083aSStefano Zampini         pcis->A_II = A_IIn;
4935a3df083aSStefano Zampini       }
4936450f8f5eSStefano Zampini     }
49373301b35fSStefano Zampini     if (pcbddc->local_mat->symmetric_set) {
49383301b35fSStefano Zampini       ierr = MatSetOption(pcis->A_II,MAT_SYMMETRIC,pcbddc->local_mat->symmetric_set);CHKERRQ(ierr);
4939964fefecSStefano Zampini     }
4940ac78edfcSStefano Zampini     /* Matrix for Dirichlet problem is pcis->A_II */
4941964fefecSStefano Zampini     n_D = pcis->n - pcis->n_B;
4942304d26faSStefano Zampini     if (!pcbddc->ksp_D) { /* create object if not yet build */
4943304d26faSStefano Zampini       ierr = KSPCreate(PETSC_COMM_SELF,&pcbddc->ksp_D);CHKERRQ(ierr);
4944304d26faSStefano Zampini       ierr = PetscObjectIncrementTabLevel((PetscObject)pcbddc->ksp_D,(PetscObject)pc,1);CHKERRQ(ierr);
4945304d26faSStefano Zampini       /* default */
4946304d26faSStefano Zampini       ierr = KSPSetType(pcbddc->ksp_D,KSPPREONLY);CHKERRQ(ierr);
4947e604994aSStefano Zampini       ierr = KSPSetOptionsPrefix(pcbddc->ksp_D,dir_prefix);CHKERRQ(ierr);
49489577ea80SStefano Zampini       ierr = PetscObjectTypeCompare((PetscObject)pcis->A_II,MATSEQSBAIJ,&issbaij);CHKERRQ(ierr);
4949304d26faSStefano Zampini       ierr = KSPGetPC(pcbddc->ksp_D,&pc_temp);CHKERRQ(ierr);
49509577ea80SStefano Zampini       if (issbaij) {
49519577ea80SStefano Zampini         ierr = PCSetType(pc_temp,PCCHOLESKY);CHKERRQ(ierr);
49529577ea80SStefano Zampini       } else {
4953304d26faSStefano Zampini         ierr = PCSetType(pc_temp,PCLU);CHKERRQ(ierr);
49549577ea80SStefano Zampini       }
4955304d26faSStefano Zampini       /* Allow user's customization */
4956304d26faSStefano Zampini       ierr = KSPSetFromOptions(pcbddc->ksp_D);CHKERRQ(ierr);
4957304d26faSStefano Zampini       ierr = PCFactorSetReuseFill(pc_temp,PETSC_TRUE);CHKERRQ(ierr);
4958304d26faSStefano Zampini     }
4959d1e9a80fSBarry Smith     ierr = KSPSetOperators(pcbddc->ksp_D,pcis->A_II,pcis->A_II);CHKERRQ(ierr);
4960b334f244SStefano Zampini     if (sub_schurs && sub_schurs->reuse_solver) {
4961df4d28bfSStefano Zampini       PCBDDCReuseSolvers reuse_solver = sub_schurs->reuse_solver;
4962d62866d3SStefano Zampini 
4963df4d28bfSStefano Zampini       ierr = KSPSetPC(pcbddc->ksp_D,reuse_solver->interior_solver);CHKERRQ(ierr);
4964d5574798SStefano Zampini     }
4965304d26faSStefano Zampini     /* umfpack interface has a bug when matrix dimension is zero. TODO solve from umfpack interface */
4966304d26faSStefano Zampini     if (!n_D) {
4967304d26faSStefano Zampini       ierr = KSPGetPC(pcbddc->ksp_D,&pc_temp);CHKERRQ(ierr);
4968304d26faSStefano Zampini       ierr = PCSetType(pc_temp,PCNONE);CHKERRQ(ierr);
4969304d26faSStefano Zampini     }
4970304d26faSStefano Zampini     /* Set Up KSP for Dirichlet problem of BDDC */
4971304d26faSStefano Zampini     ierr = KSPSetUp(pcbddc->ksp_D);CHKERRQ(ierr);
4972304d26faSStefano Zampini     /* set ksp_D into pcis data */
4973304d26faSStefano Zampini     ierr = KSPDestroy(&pcis->ksp_D);CHKERRQ(ierr);
4974304d26faSStefano Zampini     ierr = PetscObjectReference((PetscObject)pcbddc->ksp_D);CHKERRQ(ierr);
4975304d26faSStefano Zampini     pcis->ksp_D = pcbddc->ksp_D;
4976684f6988SStefano Zampini   }
4977304d26faSStefano Zampini 
4978304d26faSStefano Zampini   /* NEUMANN PROBLEM */
4979684f6988SStefano Zampini   A_RR = 0;
4980684f6988SStefano Zampini   if (neumann) {
4981d62866d3SStefano Zampini     PCBDDCSubSchurs sub_schurs = pcbddc->sub_schurs;
498204708bb6SStefano Zampini     PetscInt        ibs,mbs;
49830aa714b2SStefano Zampini     PetscBool       issbaij, reuse_neumann_solver;
498404708bb6SStefano Zampini     Mat_IS*         matis = (Mat_IS*)pc->pmat->data;
49850aa714b2SStefano Zampini 
49860aa714b2SStefano Zampini     reuse_neumann_solver = PETSC_FALSE;
49870aa714b2SStefano Zampini     if (sub_schurs && sub_schurs->reuse_solver) {
49880aa714b2SStefano Zampini       IS iP;
49890aa714b2SStefano Zampini 
49900aa714b2SStefano Zampini       reuse_neumann_solver = PETSC_TRUE;
49910aa714b2SStefano Zampini       ierr = PetscObjectQuery((PetscObject)sub_schurs->A,"__KSPFETIDP_iP",(PetscObject*)&iP);CHKERRQ(ierr);
49920aa714b2SStefano Zampini       if (iP) reuse_neumann_solver = PETSC_FALSE;
49930aa714b2SStefano Zampini     }
4994f4ddd8eeSStefano Zampini     /* Matrix for Neumann problem is A_RR -> we need to create/reuse it at this point */
49958ce42a96SStefano Zampini     ierr = ISGetSize(pcbddc->is_R_local,&n_R);CHKERRQ(ierr);
4996f4ddd8eeSStefano Zampini     if (pcbddc->ksp_R) { /* already created ksp */
4997f4ddd8eeSStefano Zampini       PetscInt nn_R;
499881d9aea3SBarry Smith       ierr = KSPGetOperators(pcbddc->ksp_R,NULL,&A_RR);CHKERRQ(ierr);
4999f4ddd8eeSStefano Zampini       ierr = PetscObjectReference((PetscObject)A_RR);CHKERRQ(ierr);
5000f4ddd8eeSStefano Zampini       ierr = MatGetSize(A_RR,&nn_R,NULL);CHKERRQ(ierr);
5001f4ddd8eeSStefano Zampini       if (nn_R != n_R) { /* old ksp is not reusable, so reset it */
5002f4ddd8eeSStefano Zampini         ierr = KSPReset(pcbddc->ksp_R);CHKERRQ(ierr);
5003f4ddd8eeSStefano Zampini         ierr = MatDestroy(&A_RR);CHKERRQ(ierr);
5004f4ddd8eeSStefano Zampini         reuse = MAT_INITIAL_MATRIX;
5005f4ddd8eeSStefano Zampini       } else { /* same sizes, but nonzero pattern depend on primal vertices so it can be changed */
5006727cdba6SStefano Zampini         if (pcbddc->new_primal_space_local) { /* we are not sure the matrix will have the same nonzero pattern */
5007f4ddd8eeSStefano Zampini           ierr = MatDestroy(&A_RR);CHKERRQ(ierr);
5008f4ddd8eeSStefano Zampini           reuse = MAT_INITIAL_MATRIX;
5009f4ddd8eeSStefano Zampini         } else { /* safe to reuse the matrix */
5010f4ddd8eeSStefano Zampini           reuse = MAT_REUSE_MATRIX;
5011f4ddd8eeSStefano Zampini         }
5012f4ddd8eeSStefano Zampini       }
5013f4ddd8eeSStefano Zampini       /* last check */
5014d1e9a80fSBarry Smith       if (pc->flag == DIFFERENT_NONZERO_PATTERN) {
5015f4ddd8eeSStefano Zampini         ierr = MatDestroy(&A_RR);CHKERRQ(ierr);
5016f4ddd8eeSStefano Zampini         reuse = MAT_INITIAL_MATRIX;
5017f4ddd8eeSStefano Zampini       }
5018f4ddd8eeSStefano Zampini     } else { /* first time, so we need to create the matrix */
5019f4ddd8eeSStefano Zampini       reuse = MAT_INITIAL_MATRIX;
5020f4ddd8eeSStefano Zampini     }
5021a00504b5SStefano Zampini     /* convert pcbddc->local_mat if needed later in PCBDDCSetUpCorrection */
5022af732b37SStefano Zampini     ierr = MatGetBlockSize(pcbddc->local_mat,&mbs);CHKERRQ(ierr);
5023af732b37SStefano Zampini     ierr = ISGetBlockSize(pcbddc->is_R_local,&ibs);CHKERRQ(ierr);
502404708bb6SStefano Zampini     ierr = PetscObjectTypeCompare((PetscObject)pcbddc->local_mat,MATSEQSBAIJ,&issbaij);CHKERRQ(ierr);
502504708bb6SStefano Zampini     if (ibs != mbs) { /* need to convert to SEQAIJ to extract any submatrix with is_R_local */
502604708bb6SStefano Zampini       if (matis->A == pcbddc->local_mat) {
502704708bb6SStefano Zampini         ierr = MatDestroy(&pcbddc->local_mat);CHKERRQ(ierr);
502804708bb6SStefano Zampini         ierr = MatConvert(matis->A,MATSEQAIJ,MAT_INITIAL_MATRIX,&pcbddc->local_mat);CHKERRQ(ierr);
5029af732b37SStefano Zampini       } else {
5030511c6705SHong Zhang         ierr = MatConvert(pcbddc->local_mat,MATSEQAIJ,MAT_INPLACE_MATRIX,&pcbddc->local_mat);CHKERRQ(ierr);
50316816873aSStefano Zampini       }
503204708bb6SStefano Zampini     } else if (issbaij) { /* need to convert to BAIJ to get offdiagonal blocks */
503304708bb6SStefano Zampini       if (matis->A == pcbddc->local_mat) {
503404708bb6SStefano Zampini         ierr = MatDestroy(&pcbddc->local_mat);CHKERRQ(ierr);
503504708bb6SStefano Zampini         ierr = MatConvert(matis->A,MATSEQBAIJ,MAT_INITIAL_MATRIX,&pcbddc->local_mat);CHKERRQ(ierr);
503604708bb6SStefano Zampini       } else {
5037511c6705SHong Zhang         ierr = MatConvert(pcbddc->local_mat,MATSEQBAIJ,MAT_INPLACE_MATRIX,&pcbddc->local_mat);CHKERRQ(ierr);
503804708bb6SStefano Zampini       }
503904708bb6SStefano Zampini     }
5040a00504b5SStefano Zampini     /* extract A_RR */
50410aa714b2SStefano Zampini     if (reuse_neumann_solver) {
5042a00504b5SStefano Zampini       PCBDDCReuseSolvers reuse_solver = sub_schurs->reuse_solver;
5043a00504b5SStefano Zampini 
5044a00504b5SStefano Zampini       if (pcbddc->dbg_flag) { /* we need A_RR to test the solver later */
504516e386b8SStefano Zampini         ierr = MatDestroy(&A_RR);CHKERRQ(ierr);
5046a00504b5SStefano Zampini         if (reuse_solver->benign_n) { /* we are not using the explicit change of basis on the pressures */
504716e386b8SStefano Zampini           ierr = PCBDDCBenignProject(pc,pcbddc->is_R_local,pcbddc->is_R_local,&A_RR);CHKERRQ(ierr);
504816e386b8SStefano Zampini         } else {
50497dae84e0SHong Zhang           ierr = MatCreateSubMatrix(pcbddc->local_mat,pcbddc->is_R_local,pcbddc->is_R_local,MAT_INITIAL_MATRIX,&A_RR);CHKERRQ(ierr);
5050a00504b5SStefano Zampini         }
5051a00504b5SStefano Zampini       } else {
5052a00504b5SStefano Zampini         ierr = MatDestroy(&A_RR);CHKERRQ(ierr);
5053a00504b5SStefano Zampini         ierr = PCGetOperators(reuse_solver->correction_solver,&A_RR,NULL);CHKERRQ(ierr);
5054a00504b5SStefano Zampini         ierr = PetscObjectReference((PetscObject)A_RR);CHKERRQ(ierr);
5055a00504b5SStefano Zampini       }
5056a00504b5SStefano Zampini     } else { /* we have to build the neumann solver, so we need to extract the relevant matrix */
50577dae84e0SHong Zhang       ierr = MatCreateSubMatrix(pcbddc->local_mat,pcbddc->is_R_local,pcbddc->is_R_local,reuse,&A_RR);CHKERRQ(ierr);
505816e386b8SStefano Zampini     }
50593301b35fSStefano Zampini     if (pcbddc->local_mat->symmetric_set) {
50603301b35fSStefano Zampini       ierr = MatSetOption(A_RR,MAT_SYMMETRIC,pcbddc->local_mat->symmetric_set);CHKERRQ(ierr);
50616816873aSStefano Zampini     }
5062f4ddd8eeSStefano Zampini     if (!pcbddc->ksp_R) { /* create object if not present */
5063304d26faSStefano Zampini       ierr = KSPCreate(PETSC_COMM_SELF,&pcbddc->ksp_R);CHKERRQ(ierr);
5064304d26faSStefano Zampini       ierr = PetscObjectIncrementTabLevel((PetscObject)pcbddc->ksp_R,(PetscObject)pc,1);CHKERRQ(ierr);
5065304d26faSStefano Zampini       /* default */
5066304d26faSStefano Zampini       ierr = KSPSetType(pcbddc->ksp_R,KSPPREONLY);CHKERRQ(ierr);
5067e604994aSStefano Zampini       ierr = KSPSetOptionsPrefix(pcbddc->ksp_R,neu_prefix);CHKERRQ(ierr);
5068304d26faSStefano Zampini       ierr = KSPGetPC(pcbddc->ksp_R,&pc_temp);CHKERRQ(ierr);
50699577ea80SStefano Zampini       ierr = PetscObjectTypeCompare((PetscObject)A_RR,MATSEQSBAIJ,&issbaij);CHKERRQ(ierr);
50709577ea80SStefano Zampini       if (issbaij) {
50719577ea80SStefano Zampini         ierr = PCSetType(pc_temp,PCCHOLESKY);CHKERRQ(ierr);
50729577ea80SStefano Zampini       } else {
5073304d26faSStefano Zampini         ierr = PCSetType(pc_temp,PCLU);CHKERRQ(ierr);
50749577ea80SStefano Zampini       }
5075304d26faSStefano Zampini       /* Allow user's customization */
5076304d26faSStefano Zampini       ierr = KSPSetFromOptions(pcbddc->ksp_R);CHKERRQ(ierr);
5077304d26faSStefano Zampini       ierr = PCFactorSetReuseFill(pc_temp,PETSC_TRUE);CHKERRQ(ierr);
5078304d26faSStefano Zampini     }
5079304d26faSStefano Zampini     /* umfpack interface has a bug when matrix dimension is zero. TODO solve from umfpack interface */
5080304d26faSStefano Zampini     if (!n_R) {
5081304d26faSStefano Zampini       ierr = KSPGetPC(pcbddc->ksp_R,&pc_temp);CHKERRQ(ierr);
5082304d26faSStefano Zampini       ierr = PCSetType(pc_temp,PCNONE);CHKERRQ(ierr);
5083304d26faSStefano Zampini     }
50845cbda25cSStefano Zampini     ierr = KSPSetOperators(pcbddc->ksp_R,A_RR,A_RR);CHKERRQ(ierr);
5085df4d28bfSStefano Zampini     /* Reuse solver if it is present */
50860aa714b2SStefano Zampini     if (reuse_neumann_solver) {
5087df4d28bfSStefano Zampini       PCBDDCReuseSolvers reuse_solver = sub_schurs->reuse_solver;
5088d62866d3SStefano Zampini 
5089df4d28bfSStefano Zampini       ierr = KSPSetPC(pcbddc->ksp_R,reuse_solver->correction_solver);CHKERRQ(ierr);
5090d62866d3SStefano Zampini     }
5091304d26faSStefano Zampini     /* Set Up KSP for Neumann problem of BDDC */
5092304d26faSStefano Zampini     ierr = KSPSetUp(pcbddc->ksp_R);CHKERRQ(ierr);
5093684f6988SStefano Zampini   }
5094304d26faSStefano Zampini 
5095684f6988SStefano Zampini   if (pcbddc->dbg_flag) {
5096684f6988SStefano Zampini     ierr = PetscViewerFlush(pcbddc->dbg_viewer);CHKERRQ(ierr);
50971575c14dSBarry Smith     ierr = PetscViewerASCIIPushSynchronized(pcbddc->dbg_viewer);CHKERRQ(ierr);
5098684f6988SStefano Zampini     ierr = PetscViewerASCIIPrintf(pcbddc->dbg_viewer,"--------------------------------------------------\n");CHKERRQ(ierr);
5099684f6988SStefano Zampini   }
5100c7017625SStefano Zampini 
5101c7017625SStefano Zampini   /* adapt Dirichlet and Neumann solvers if a nullspace correction has been requested */
510235529e7bSStefano Zampini   check_corr = PETSC_FALSE;
5103c7017625SStefano Zampini   if (pcbddc->NullSpace_corr[0]) {
5104c7017625SStefano Zampini     ierr = PCBDDCSetUseExactDirichlet(pc,PETSC_FALSE);CHKERRQ(ierr);
5105c7017625SStefano Zampini   }
5106c7017625SStefano Zampini   if (dirichlet && pcbddc->NullSpace_corr[0] && !pcbddc->switch_static) {
510735529e7bSStefano Zampini     check_corr = PETSC_TRUE;
5108c7017625SStefano Zampini     ierr = PCBDDCNullSpaceAssembleCorrection(pc,PETSC_TRUE,pcbddc->NullSpace_corr[1]);CHKERRQ(ierr);
5109c7017625SStefano Zampini   }
5110c7017625SStefano Zampini   if (neumann && pcbddc->NullSpace_corr[2]) {
511135529e7bSStefano Zampini     check_corr = PETSC_TRUE;
5112c7017625SStefano Zampini     ierr = PCBDDCNullSpaceAssembleCorrection(pc,PETSC_FALSE,pcbddc->NullSpace_corr[3]);CHKERRQ(ierr);
5113c7017625SStefano Zampini   }
5114c7017625SStefano Zampini   /* check Dirichlet and Neumann solvers */
5115c7017625SStefano Zampini   if (pcbddc->dbg_flag) {
5116684f6988SStefano Zampini     if (dirichlet) { /* Dirichlet */
51170fccc4e9SStefano Zampini       ierr = VecSetRandom(pcis->vec1_D,NULL);CHKERRQ(ierr);
51180fccc4e9SStefano Zampini       ierr = MatMult(pcis->A_II,pcis->vec1_D,pcis->vec2_D);CHKERRQ(ierr);
51190fccc4e9SStefano Zampini       ierr = KSPSolve(pcbddc->ksp_D,pcis->vec2_D,pcis->vec2_D);CHKERRQ(ierr);
51200fccc4e9SStefano Zampini       ierr = VecAXPY(pcis->vec1_D,m_one,pcis->vec2_D);CHKERRQ(ierr);
51210fccc4e9SStefano Zampini       ierr = VecNorm(pcis->vec1_D,NORM_INFINITY,&value);CHKERRQ(ierr);
5122e604994aSStefano Zampini       ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"Subdomain %04d infinity error for Dirichlet solve (%s) = % 1.14e \n",PetscGlobalRank,((PetscObject)(pcbddc->ksp_D))->prefix,value);CHKERRQ(ierr);
512335529e7bSStefano Zampini       if (check_corr) {
5124c7017625SStefano Zampini         ierr = PCBDDCNullSpaceCheckCorrection(pc,PETSC_TRUE);CHKERRQ(ierr);
5125c7017625SStefano Zampini       }
5126304d26faSStefano Zampini       ierr = PetscViewerFlush(pcbddc->dbg_viewer);CHKERRQ(ierr);
5127304d26faSStefano Zampini     }
5128684f6988SStefano Zampini     if (neumann) { /* Neumann */
51290fccc4e9SStefano Zampini       ierr = VecSetRandom(pcbddc->vec1_R,NULL);CHKERRQ(ierr);
51300fccc4e9SStefano Zampini       ierr = MatMult(A_RR,pcbddc->vec1_R,pcbddc->vec2_R);CHKERRQ(ierr);
51310fccc4e9SStefano Zampini       ierr = KSPSolve(pcbddc->ksp_R,pcbddc->vec2_R,pcbddc->vec2_R);CHKERRQ(ierr);
51320fccc4e9SStefano Zampini       ierr = VecAXPY(pcbddc->vec1_R,m_one,pcbddc->vec2_R);CHKERRQ(ierr);
51330fccc4e9SStefano Zampini       ierr = VecNorm(pcbddc->vec1_R,NORM_INFINITY,&value);CHKERRQ(ierr);
5134e604994aSStefano Zampini       ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"Subdomain %04d infinity error for Neumann solve (%s) = % 1.14e\n",PetscGlobalRank,((PetscObject)(pcbddc->ksp_R))->prefix,value);CHKERRQ(ierr);
513535529e7bSStefano Zampini       if (check_corr) {
5136c7017625SStefano Zampini         ierr = PCBDDCNullSpaceCheckCorrection(pc,PETSC_FALSE);CHKERRQ(ierr);
5137c7017625SStefano Zampini       }
5138304d26faSStefano Zampini       ierr = PetscViewerFlush(pcbddc->dbg_viewer);CHKERRQ(ierr);
5139304d26faSStefano Zampini     }
5140684f6988SStefano Zampini   }
51415cbda25cSStefano Zampini   /* free Neumann problem's matrix */
51425cbda25cSStefano Zampini   ierr = MatDestroy(&A_RR);CHKERRQ(ierr);
5143304d26faSStefano Zampini   PetscFunctionReturn(0);
5144304d26faSStefano Zampini }
5145304d26faSStefano Zampini 
514680677318SStefano Zampini static PetscErrorCode  PCBDDCSolveSubstructureCorrection(PC pc, Vec inout_B, Vec inout_D, PetscBool applytranspose)
5147674ae819SStefano Zampini {
5148674ae819SStefano Zampini   PetscErrorCode  ierr;
5149674ae819SStefano Zampini   PC_BDDC*        pcbddc = (PC_BDDC*)(pc->data);
5150be83ff47SStefano Zampini   PCBDDCSubSchurs sub_schurs = pcbddc->sub_schurs;
5151b334f244SStefano Zampini   PetscBool       reuse_solver = sub_schurs ? ( sub_schurs->reuse_solver ? PETSC_TRUE : PETSC_FALSE ) : PETSC_FALSE;
5152674ae819SStefano Zampini 
5153674ae819SStefano Zampini   PetscFunctionBegin;
5154b334f244SStefano Zampini   if (!reuse_solver) {
515580677318SStefano Zampini     ierr = VecSet(pcbddc->vec1_R,0.);CHKERRQ(ierr);
515620c7b377SStefano Zampini   }
515780677318SStefano Zampini   if (!pcbddc->switch_static) {
515880677318SStefano Zampini     if (applytranspose && pcbddc->local_auxmat1) {
515980677318SStefano Zampini       ierr = MatMultTranspose(pcbddc->local_auxmat2,inout_B,pcbddc->vec1_C);CHKERRQ(ierr);
516080677318SStefano Zampini       ierr = MatMultTransposeAdd(pcbddc->local_auxmat1,pcbddc->vec1_C,inout_B,inout_B);CHKERRQ(ierr);
516120c7b377SStefano Zampini     }
5162b334f244SStefano Zampini     if (!reuse_solver) {
516380677318SStefano Zampini       ierr = VecScatterBegin(pcbddc->R_to_B,inout_B,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
516480677318SStefano Zampini       ierr = VecScatterEnd(pcbddc->R_to_B,inout_B,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
516520c7b377SStefano Zampini     } else {
5166df4d28bfSStefano Zampini       PCBDDCReuseSolvers reuse_solver = sub_schurs->reuse_solver;
5167be83ff47SStefano Zampini 
5168df4d28bfSStefano Zampini       ierr = VecScatterBegin(reuse_solver->correction_scatter_B,inout_B,reuse_solver->rhs_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
5169df4d28bfSStefano Zampini       ierr = VecScatterEnd(reuse_solver->correction_scatter_B,inout_B,reuse_solver->rhs_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
517020c7b377SStefano Zampini     }
5171be83ff47SStefano Zampini   } else {
517280677318SStefano Zampini     ierr = VecScatterBegin(pcbddc->R_to_B,inout_B,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
517380677318SStefano Zampini     ierr = VecScatterEnd(pcbddc->R_to_B,inout_B,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
517480677318SStefano Zampini     ierr = VecScatterBegin(pcbddc->R_to_D,inout_D,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
517580677318SStefano Zampini     ierr = VecScatterEnd(pcbddc->R_to_D,inout_D,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
517680677318SStefano Zampini     if (applytranspose && pcbddc->local_auxmat1) {
517780677318SStefano Zampini       ierr = MatMultTranspose(pcbddc->local_auxmat2,pcbddc->vec1_R,pcbddc->vec1_C);CHKERRQ(ierr);
517880677318SStefano Zampini       ierr = MatMultTransposeAdd(pcbddc->local_auxmat1,pcbddc->vec1_C,inout_B,inout_B);CHKERRQ(ierr);
517980677318SStefano Zampini       ierr = VecScatterBegin(pcbddc->R_to_B,inout_B,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
518080677318SStefano Zampini       ierr = VecScatterEnd(pcbddc->R_to_B,inout_B,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
5181674ae819SStefano Zampini     }
5182674ae819SStefano Zampini   }
5183b334f244SStefano Zampini   if (!reuse_solver || pcbddc->switch_static) {
518480677318SStefano Zampini     if (applytranspose) {
518580677318SStefano Zampini       ierr = KSPSolveTranspose(pcbddc->ksp_R,pcbddc->vec1_R,pcbddc->vec1_R);CHKERRQ(ierr);
518680677318SStefano Zampini     } else {
518780677318SStefano Zampini       ierr = KSPSolve(pcbddc->ksp_R,pcbddc->vec1_R,pcbddc->vec1_R);CHKERRQ(ierr);
518880677318SStefano Zampini     }
5189be83ff47SStefano Zampini   } else {
5190df4d28bfSStefano Zampini     PCBDDCReuseSolvers reuse_solver = sub_schurs->reuse_solver;
5191be83ff47SStefano Zampini 
5192be83ff47SStefano Zampini     if (applytranspose) {
5193df4d28bfSStefano Zampini       ierr = MatFactorSolveSchurComplementTranspose(reuse_solver->F,reuse_solver->rhs_B,reuse_solver->sol_B);CHKERRQ(ierr);
5194be83ff47SStefano Zampini     } else {
5195df4d28bfSStefano Zampini       ierr = MatFactorSolveSchurComplement(reuse_solver->F,reuse_solver->rhs_B,reuse_solver->sol_B);CHKERRQ(ierr);
5196be83ff47SStefano Zampini     }
5197be83ff47SStefano Zampini   }
519880677318SStefano Zampini   ierr = VecSet(inout_B,0.);CHKERRQ(ierr);
519980677318SStefano Zampini   if (!pcbddc->switch_static) {
5200b334f244SStefano Zampini     if (!reuse_solver) {
520180677318SStefano Zampini       ierr = VecScatterBegin(pcbddc->R_to_B,pcbddc->vec1_R,inout_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
520280677318SStefano Zampini       ierr = VecScatterEnd(pcbddc->R_to_B,pcbddc->vec1_R,inout_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
5203be83ff47SStefano Zampini     } else {
5204df4d28bfSStefano Zampini       PCBDDCReuseSolvers reuse_solver = sub_schurs->reuse_solver;
5205be83ff47SStefano Zampini 
5206df4d28bfSStefano Zampini       ierr = VecScatterBegin(reuse_solver->correction_scatter_B,reuse_solver->sol_B,inout_B,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
5207df4d28bfSStefano Zampini       ierr = VecScatterEnd(reuse_solver->correction_scatter_B,reuse_solver->sol_B,inout_B,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
5208be83ff47SStefano Zampini     }
520980677318SStefano Zampini     if (!applytranspose && pcbddc->local_auxmat1) {
521080677318SStefano Zampini       ierr = MatMult(pcbddc->local_auxmat1,inout_B,pcbddc->vec1_C);CHKERRQ(ierr);
521180677318SStefano Zampini       ierr = MatMultAdd(pcbddc->local_auxmat2,pcbddc->vec1_C,inout_B,inout_B);CHKERRQ(ierr);
521280677318SStefano Zampini     }
521380677318SStefano Zampini   } else {
521480677318SStefano Zampini     ierr = VecScatterBegin(pcbddc->R_to_B,pcbddc->vec1_R,inout_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
521580677318SStefano Zampini     ierr = VecScatterEnd(pcbddc->R_to_B,pcbddc->vec1_R,inout_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
521680677318SStefano Zampini     ierr = VecScatterBegin(pcbddc->R_to_D,pcbddc->vec1_R,inout_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
521780677318SStefano Zampini     ierr = VecScatterEnd(pcbddc->R_to_D,pcbddc->vec1_R,inout_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
521880677318SStefano Zampini     if (!applytranspose && pcbddc->local_auxmat1) {
521980677318SStefano Zampini       ierr = MatMult(pcbddc->local_auxmat1,inout_B,pcbddc->vec1_C);CHKERRQ(ierr);
522080677318SStefano Zampini       ierr = MatMultAdd(pcbddc->local_auxmat2,pcbddc->vec1_C,pcbddc->vec1_R,pcbddc->vec1_R);CHKERRQ(ierr);
522180677318SStefano Zampini     }
522280677318SStefano Zampini     ierr = VecScatterBegin(pcbddc->R_to_B,pcbddc->vec1_R,inout_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
522380677318SStefano Zampini     ierr = VecScatterEnd(pcbddc->R_to_B,pcbddc->vec1_R,inout_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
522480677318SStefano Zampini     ierr = VecScatterBegin(pcbddc->R_to_D,pcbddc->vec1_R,inout_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
522580677318SStefano Zampini     ierr = VecScatterEnd(pcbddc->R_to_D,pcbddc->vec1_R,inout_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
5226674ae819SStefano Zampini   }
5227674ae819SStefano Zampini   PetscFunctionReturn(0);
5228674ae819SStefano Zampini }
5229674ae819SStefano Zampini 
5230dc359a40SStefano Zampini /* parameter apply transpose determines if the interface preconditioner should be applied transposed or not */
5231dc359a40SStefano Zampini PetscErrorCode  PCBDDCApplyInterfacePreconditioner(PC pc, PetscBool applytranspose)
5232674ae819SStefano Zampini {
5233674ae819SStefano Zampini   PetscErrorCode ierr;
5234674ae819SStefano Zampini   PC_BDDC*        pcbddc = (PC_BDDC*)(pc->data);
5235674ae819SStefano Zampini   PC_IS*            pcis = (PC_IS*)  (pc->data);
5236674ae819SStefano Zampini   const PetscScalar zero = 0.0;
5237674ae819SStefano Zampini 
5238674ae819SStefano Zampini   PetscFunctionBegin;
5239dc359a40SStefano Zampini   /* Application of PSI^T or PHI^T (depending on applytranspose, see comment above) */
52404fee134fSStefano Zampini   if (!pcbddc->benign_apply_coarse_only) {
5241dc359a40SStefano Zampini     if (applytranspose) {
5242674ae819SStefano Zampini       ierr = MatMultTranspose(pcbddc->coarse_phi_B,pcis->vec1_B,pcbddc->vec1_P);CHKERRQ(ierr);
52438eeda7d8SStefano Zampini       if (pcbddc->switch_static) { ierr = MatMultTransposeAdd(pcbddc->coarse_phi_D,pcis->vec1_D,pcbddc->vec1_P,pcbddc->vec1_P);CHKERRQ(ierr); }
5244dc359a40SStefano Zampini     } else {
5245674ae819SStefano Zampini       ierr = MatMultTranspose(pcbddc->coarse_psi_B,pcis->vec1_B,pcbddc->vec1_P);CHKERRQ(ierr);
5246674ae819SStefano Zampini       if (pcbddc->switch_static) { ierr = MatMultTransposeAdd(pcbddc->coarse_psi_D,pcis->vec1_D,pcbddc->vec1_P,pcbddc->vec1_P);CHKERRQ(ierr); }
524715aaf578SStefano Zampini     }
52484fee134fSStefano Zampini   } else {
52494fee134fSStefano Zampini     ierr = VecSet(pcbddc->vec1_P,zero);CHKERRQ(ierr);
52504fee134fSStefano Zampini   }
5251efc2fbd9SStefano Zampini 
5252efc2fbd9SStefano Zampini   /* add p0 to the last value of vec1_P holding the coarse dof relative to p0 */
52534f1b2e48SStefano Zampini   if (pcbddc->benign_n) {
5254efc2fbd9SStefano Zampini     PetscScalar *array;
52554f1b2e48SStefano Zampini     PetscInt    j;
5256efc2fbd9SStefano Zampini 
5257efc2fbd9SStefano Zampini     ierr = VecGetArray(pcbddc->vec1_P,&array);CHKERRQ(ierr);
52584f1b2e48SStefano Zampini     for (j=0;j<pcbddc->benign_n;j++) array[pcbddc->local_primal_size-pcbddc->benign_n+j] += pcbddc->benign_p0[j];
5259efc2fbd9SStefano Zampini     ierr = VecRestoreArray(pcbddc->vec1_P,&array);CHKERRQ(ierr);
5260efc2fbd9SStefano Zampini   }
5261efc2fbd9SStefano Zampini 
526212edc857SStefano Zampini   /* start communications from local primal nodes to rhs of coarse solver */
526312edc857SStefano Zampini   ierr = VecSet(pcbddc->coarse_vec,zero);CHKERRQ(ierr);
526412edc857SStefano Zampini   ierr = PCBDDCScatterCoarseDataBegin(pc,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
526512edc857SStefano Zampini   ierr = PCBDDCScatterCoarseDataEnd(pc,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
526612edc857SStefano Zampini 
52679f00e9b4SStefano Zampini     /* Coarse solution -> rhs and sol updated inside PCBDDCScatterCoarseDataBegin/End */
526812edc857SStefano Zampini   if (pcbddc->coarse_ksp) {
526951694757SStefano Zampini     Mat          coarse_mat;
5270964fefecSStefano Zampini     Vec          rhs,sol;
527151694757SStefano Zampini     MatNullSpace nullsp;
527227b6a85dSStefano Zampini     PetscBool    isbddc = PETSC_FALSE;
5273964fefecSStefano Zampini 
527427b6a85dSStefano Zampini     if (pcbddc->benign_have_null) {
527527b6a85dSStefano Zampini       PC        coarse_pc;
527627b6a85dSStefano Zampini 
527727b6a85dSStefano Zampini       ierr = KSPGetPC(pcbddc->coarse_ksp,&coarse_pc);CHKERRQ(ierr);
527827b6a85dSStefano Zampini       ierr = PetscObjectTypeCompare((PetscObject)coarse_pc,PCBDDC,&isbddc);CHKERRQ(ierr);
527927b6a85dSStefano Zampini       /* we need to propagate to coarser levels the need for a possible benign correction */
528027b6a85dSStefano Zampini       if (isbddc && pcbddc->benign_apply_coarse_only && !pcbddc->benign_skip_correction) {
528127b6a85dSStefano Zampini         PC_BDDC* coarsepcbddc = (PC_BDDC*)(coarse_pc->data);
528227b6a85dSStefano Zampini         coarsepcbddc->benign_skip_correction = PETSC_FALSE;
52833bca92a6SStefano Zampini         coarsepcbddc->benign_apply_coarse_only = PETSC_TRUE;
528427b6a85dSStefano Zampini       }
528527b6a85dSStefano Zampini     }
5286964fefecSStefano Zampini     ierr = KSPGetRhs(pcbddc->coarse_ksp,&rhs);CHKERRQ(ierr);
5287964fefecSStefano Zampini     ierr = KSPGetSolution(pcbddc->coarse_ksp,&sol);CHKERRQ(ierr);
528851694757SStefano Zampini     ierr = KSPGetOperators(pcbddc->coarse_ksp,&coarse_mat,NULL);CHKERRQ(ierr);
528951694757SStefano Zampini     ierr = MatGetNullSpace(coarse_mat,&nullsp);CHKERRQ(ierr);
529051694757SStefano Zampini     if (nullsp) {
529151694757SStefano Zampini       ierr = MatNullSpaceRemove(nullsp,rhs);CHKERRQ(ierr);
529251694757SStefano Zampini     }
529312edc857SStefano Zampini     if (applytranspose) {
52949a962809SStefano Zampini       if (pcbddc->benign_apply_coarse_only) SETERRQ(PetscObjectComm((PetscObject)pcbddc->coarse_ksp),PETSC_ERR_SUP,"Not yet implemented");
5295964fefecSStefano Zampini       ierr = KSPSolveTranspose(pcbddc->coarse_ksp,rhs,sol);CHKERRQ(ierr);
52962701bc32SStefano Zampini     } else {
52971f4df5f7SStefano Zampini       if (pcbddc->benign_apply_coarse_only && isbddc) { /* need just to apply the coarse preconditioner during presolve */
52982701bc32SStefano Zampini         PC        coarse_pc;
52992701bc32SStefano Zampini 
53002701bc32SStefano Zampini         ierr = KSPGetPC(pcbddc->coarse_ksp,&coarse_pc);CHKERRQ(ierr);
53012701bc32SStefano Zampini         ierr = PCPreSolve(coarse_pc,pcbddc->coarse_ksp);CHKERRQ(ierr);
53023e589ea0SStefano Zampini         ierr = PCBDDCBenignRemoveInterior(coarse_pc,rhs,sol);CHKERRQ(ierr);
53032701bc32SStefano Zampini         ierr = PCPostSolve(coarse_pc,pcbddc->coarse_ksp);CHKERRQ(ierr);
530412edc857SStefano Zampini       } else {
5305964fefecSStefano Zampini         ierr = KSPSolve(pcbddc->coarse_ksp,rhs,sol);CHKERRQ(ierr);
530612edc857SStefano Zampini       }
53072701bc32SStefano Zampini     }
53081d82a3b6SStefano Zampini     /* we don't need the benign correction at coarser levels anymore */
530927b6a85dSStefano Zampini     if (pcbddc->benign_have_null && isbddc) {
531027b6a85dSStefano Zampini       PC        coarse_pc;
531127b6a85dSStefano Zampini       PC_BDDC*  coarsepcbddc;
531227b6a85dSStefano Zampini 
531327b6a85dSStefano Zampini       ierr = KSPGetPC(pcbddc->coarse_ksp,&coarse_pc);CHKERRQ(ierr);
531427b6a85dSStefano Zampini       coarsepcbddc = (PC_BDDC*)(coarse_pc->data);
531527b6a85dSStefano Zampini       coarsepcbddc->benign_skip_correction = PETSC_TRUE;
53163bca92a6SStefano Zampini       coarsepcbddc->benign_apply_coarse_only = PETSC_FALSE;
531727b6a85dSStefano Zampini     }
531851694757SStefano Zampini     if (nullsp) {
531951694757SStefano Zampini       ierr = MatNullSpaceRemove(nullsp,sol);CHKERRQ(ierr);
532051694757SStefano Zampini     }
532112edc857SStefano Zampini   }
5322674ae819SStefano Zampini 
5323674ae819SStefano Zampini   /* Local solution on R nodes */
53244fee134fSStefano Zampini   if (pcis->n && !pcbddc->benign_apply_coarse_only) {
532580677318SStefano Zampini     ierr = PCBDDCSolveSubstructureCorrection(pc,pcis->vec1_B,pcis->vec1_D,applytranspose);CHKERRQ(ierr);
53269f00e9b4SStefano Zampini   }
53279f00e9b4SStefano Zampini   /* communications from coarse sol to local primal nodes */
53289f00e9b4SStefano Zampini   ierr = PCBDDCScatterCoarseDataBegin(pc,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
532912edc857SStefano Zampini   ierr = PCBDDCScatterCoarseDataEnd(pc,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
5330674ae819SStefano Zampini 
53314fee134fSStefano Zampini   /* Sum contributions from the two levels */
53324fee134fSStefano Zampini   if (!pcbddc->benign_apply_coarse_only) {
5333dc359a40SStefano Zampini     if (applytranspose) {
5334dc359a40SStefano Zampini       ierr = MatMultAdd(pcbddc->coarse_psi_B,pcbddc->vec1_P,pcis->vec1_B,pcis->vec1_B);CHKERRQ(ierr);
5335dc359a40SStefano Zampini       if (pcbddc->switch_static) { ierr = MatMultAdd(pcbddc->coarse_psi_D,pcbddc->vec1_P,pcis->vec1_D,pcis->vec1_D);CHKERRQ(ierr); }
5336dc359a40SStefano Zampini     } else {
5337674ae819SStefano Zampini       ierr = MatMultAdd(pcbddc->coarse_phi_B,pcbddc->vec1_P,pcis->vec1_B,pcis->vec1_B);CHKERRQ(ierr);
53388eeda7d8SStefano Zampini       if (pcbddc->switch_static) { ierr = MatMultAdd(pcbddc->coarse_phi_D,pcbddc->vec1_P,pcis->vec1_D,pcis->vec1_D);CHKERRQ(ierr); }
5339dc359a40SStefano Zampini     }
5340efc2fbd9SStefano Zampini     /* store p0 */
53414f1b2e48SStefano Zampini     if (pcbddc->benign_n) {
5342efc2fbd9SStefano Zampini       PetscScalar *array;
53434f1b2e48SStefano Zampini       PetscInt    j;
5344efc2fbd9SStefano Zampini 
5345efc2fbd9SStefano Zampini       ierr = VecGetArray(pcbddc->vec1_P,&array);CHKERRQ(ierr);
53464f1b2e48SStefano Zampini       for (j=0;j<pcbddc->benign_n;j++) pcbddc->benign_p0[j] = array[pcbddc->local_primal_size-pcbddc->benign_n+j];
5347efc2fbd9SStefano Zampini       ierr = VecRestoreArray(pcbddc->vec1_P,&array);CHKERRQ(ierr);
5348efc2fbd9SStefano Zampini     }
53494fee134fSStefano Zampini   } else { /* expand the coarse solution */
53504fee134fSStefano Zampini     if (applytranspose) {
53514fee134fSStefano Zampini       ierr = MatMult(pcbddc->coarse_psi_B,pcbddc->vec1_P,pcis->vec1_B);CHKERRQ(ierr);
53524fee134fSStefano Zampini     } else {
53534fee134fSStefano Zampini       ierr = MatMult(pcbddc->coarse_phi_B,pcbddc->vec1_P,pcis->vec1_B);CHKERRQ(ierr);
53544fee134fSStefano Zampini     }
53554fee134fSStefano Zampini   }
5356674ae819SStefano Zampini   PetscFunctionReturn(0);
5357674ae819SStefano Zampini }
5358674ae819SStefano Zampini 
535912edc857SStefano Zampini PetscErrorCode PCBDDCScatterCoarseDataBegin(PC pc,InsertMode imode, ScatterMode smode)
5360674ae819SStefano Zampini {
5361674ae819SStefano Zampini   PetscErrorCode ierr;
5362674ae819SStefano Zampini   PC_BDDC*       pcbddc = (PC_BDDC*)(pc->data);
536358da7f69SStefano Zampini   PetscScalar    *array;
536412edc857SStefano Zampini   Vec            from,to;
5365674ae819SStefano Zampini 
5366674ae819SStefano Zampini   PetscFunctionBegin;
536712edc857SStefano Zampini   if (smode == SCATTER_REVERSE) { /* from global to local -> get data from coarse solution */
536812edc857SStefano Zampini     from = pcbddc->coarse_vec;
536912edc857SStefano Zampini     to = pcbddc->vec1_P;
537012edc857SStefano Zampini     if (pcbddc->coarse_ksp) { /* get array from coarse processes */
537112edc857SStefano Zampini       Vec tvec;
537258da7f69SStefano Zampini 
537358da7f69SStefano Zampini       ierr = KSPGetRhs(pcbddc->coarse_ksp,&tvec);CHKERRQ(ierr);
537458da7f69SStefano Zampini       ierr = VecResetArray(tvec);CHKERRQ(ierr);
537512edc857SStefano Zampini       ierr = KSPGetSolution(pcbddc->coarse_ksp,&tvec);CHKERRQ(ierr);
537658da7f69SStefano Zampini       ierr = VecGetArray(tvec,&array);CHKERRQ(ierr);
537758da7f69SStefano Zampini       ierr = VecPlaceArray(from,array);CHKERRQ(ierr);
537858da7f69SStefano Zampini       ierr = VecRestoreArray(tvec,&array);CHKERRQ(ierr);
537912edc857SStefano Zampini     }
538012edc857SStefano Zampini   } else { /* from local to global -> put data in coarse right hand side */
538112edc857SStefano Zampini     from = pcbddc->vec1_P;
538212edc857SStefano Zampini     to = pcbddc->coarse_vec;
538312edc857SStefano Zampini   }
538412edc857SStefano Zampini   ierr = VecScatterBegin(pcbddc->coarse_loc_to_glob,from,to,imode,smode);CHKERRQ(ierr);
5385674ae819SStefano Zampini   PetscFunctionReturn(0);
5386674ae819SStefano Zampini }
5387674ae819SStefano Zampini 
538812edc857SStefano Zampini PetscErrorCode PCBDDCScatterCoarseDataEnd(PC pc, InsertMode imode, ScatterMode smode)
5389674ae819SStefano Zampini {
5390674ae819SStefano Zampini   PetscErrorCode ierr;
5391674ae819SStefano Zampini   PC_BDDC*       pcbddc = (PC_BDDC*)(pc->data);
539258da7f69SStefano Zampini   PetscScalar    *array;
539312edc857SStefano Zampini   Vec            from,to;
5394674ae819SStefano Zampini 
5395674ae819SStefano Zampini   PetscFunctionBegin;
539612edc857SStefano Zampini   if (smode == SCATTER_REVERSE) { /* from global to local -> get data from coarse solution */
539712edc857SStefano Zampini     from = pcbddc->coarse_vec;
539812edc857SStefano Zampini     to = pcbddc->vec1_P;
539912edc857SStefano Zampini   } else { /* from local to global -> put data in coarse right hand side */
540012edc857SStefano Zampini     from = pcbddc->vec1_P;
540112edc857SStefano Zampini     to = pcbddc->coarse_vec;
540212edc857SStefano Zampini   }
540312edc857SStefano Zampini   ierr = VecScatterEnd(pcbddc->coarse_loc_to_glob,from,to,imode,smode);CHKERRQ(ierr);
540412edc857SStefano Zampini   if (smode == SCATTER_FORWARD) {
540512edc857SStefano Zampini     if (pcbddc->coarse_ksp) { /* get array from coarse processes */
540612edc857SStefano Zampini       Vec tvec;
540758da7f69SStefano Zampini 
540812edc857SStefano Zampini       ierr = KSPGetRhs(pcbddc->coarse_ksp,&tvec);CHKERRQ(ierr);
540958da7f69SStefano Zampini       ierr = VecGetArray(to,&array);CHKERRQ(ierr);
541058da7f69SStefano Zampini       ierr = VecPlaceArray(tvec,array);CHKERRQ(ierr);
541158da7f69SStefano Zampini       ierr = VecRestoreArray(to,&array);CHKERRQ(ierr);
541258da7f69SStefano Zampini     }
541358da7f69SStefano Zampini   } else {
541458da7f69SStefano Zampini     if (pcbddc->coarse_ksp) { /* restore array of pcbddc->coarse_vec */
541558da7f69SStefano Zampini      ierr = VecResetArray(from);CHKERRQ(ierr);
541612edc857SStefano Zampini     }
541712edc857SStefano Zampini   }
5418674ae819SStefano Zampini   PetscFunctionReturn(0);
5419674ae819SStefano Zampini }
5420674ae819SStefano Zampini 
5421984c4197SStefano Zampini /* uncomment for testing purposes */
5422984c4197SStefano Zampini /* #define PETSC_MISSING_LAPACK_GESVD 1 */
5423674ae819SStefano Zampini PetscErrorCode PCBDDCConstraintsSetUp(PC pc)
5424674ae819SStefano Zampini {
5425674ae819SStefano Zampini   PetscErrorCode    ierr;
5426674ae819SStefano Zampini   PC_IS*            pcis = (PC_IS*)(pc->data);
5427674ae819SStefano Zampini   PC_BDDC*          pcbddc = (PC_BDDC*)pc->data;
5428674ae819SStefano Zampini   Mat_IS*           matis = (Mat_IS*)pc->pmat->data;
5429984c4197SStefano Zampini   /* one and zero */
5430984c4197SStefano Zampini   PetscScalar       one=1.0,zero=0.0;
5431984c4197SStefano Zampini   /* space to store constraints and their local indices */
54329162d606SStefano Zampini   PetscScalar       *constraints_data;
54339162d606SStefano Zampini   PetscInt          *constraints_idxs,*constraints_idxs_B;
54349162d606SStefano Zampini   PetscInt          *constraints_idxs_ptr,*constraints_data_ptr;
54359162d606SStefano Zampini   PetscInt          *constraints_n;
5436984c4197SStefano Zampini   /* iterators */
5437b3d85658SStefano Zampini   PetscInt          i,j,k,total_counts,total_counts_cc,cum;
5438984c4197SStefano Zampini   /* BLAS integers */
5439e310c8b4SStefano Zampini   PetscBLASInt      lwork,lierr;
5440e310c8b4SStefano Zampini   PetscBLASInt      Blas_N,Blas_M,Blas_K,Blas_one=1;
5441c4303822SStefano Zampini   PetscBLASInt      Blas_LDA,Blas_LDB,Blas_LDC;
5442727cdba6SStefano Zampini   /* reuse */
54430e6343abSStefano Zampini   PetscInt          olocal_primal_size,olocal_primal_size_cc;
54440e6343abSStefano Zampini   PetscInt          *olocal_primal_ref_node,*olocal_primal_ref_mult;
5445984c4197SStefano Zampini   /* change of basis */
5446b3d85658SStefano Zampini   PetscBool         qr_needed;
54479162d606SStefano Zampini   PetscBT           change_basis,qr_needed_idx;
5448984c4197SStefano Zampini   /* auxiliary stuff */
544964efe560SStefano Zampini   PetscInt          *nnz,*is_indices;
54508a0068c3SStefano Zampini   PetscInt          ncc;
5451984c4197SStefano Zampini   /* some quantities */
545245a1bb75SStefano Zampini   PetscInt          n_vertices,total_primal_vertices,valid_constraints;
5453a58a30b4SStefano Zampini   PetscInt          size_of_constraint,max_size_of_constraint=0,max_constraints,temp_constraints;
5454984c4197SStefano Zampini 
5455674ae819SStefano Zampini   PetscFunctionBegin;
54568e61c736SStefano Zampini   /* Destroy Mat objects computed previously */
54578e61c736SStefano Zampini   ierr = MatDestroy(&pcbddc->ChangeOfBasisMatrix);CHKERRQ(ierr);
54588e61c736SStefano Zampini   ierr = MatDestroy(&pcbddc->ConstraintMatrix);CHKERRQ(ierr);
545916909a7fSStefano Zampini   ierr = MatDestroy(&pcbddc->switch_static_change);CHKERRQ(ierr);
5460088faed8SStefano Zampini   /* save info on constraints from previous setup (if any) */
5461088faed8SStefano Zampini   olocal_primal_size = pcbddc->local_primal_size;
54620e6343abSStefano Zampini   olocal_primal_size_cc = pcbddc->local_primal_size_cc;
54630e6343abSStefano Zampini   ierr = PetscMalloc2(olocal_primal_size_cc,&olocal_primal_ref_node,olocal_primal_size_cc,&olocal_primal_ref_mult);CHKERRQ(ierr);
54640e6343abSStefano Zampini   ierr = PetscMemcpy(olocal_primal_ref_node,pcbddc->local_primal_ref_node,olocal_primal_size_cc*sizeof(PetscInt));CHKERRQ(ierr);
54650e6343abSStefano Zampini   ierr = PetscMemcpy(olocal_primal_ref_mult,pcbddc->local_primal_ref_mult,olocal_primal_size_cc*sizeof(PetscInt));CHKERRQ(ierr);
54660e6343abSStefano Zampini   ierr = PetscFree2(pcbddc->local_primal_ref_node,pcbddc->local_primal_ref_mult);CHKERRQ(ierr);
5467088faed8SStefano Zampini   ierr = PetscFree(pcbddc->primal_indices_local_idxs);CHKERRQ(ierr);
5468cf5a6209SStefano Zampini 
5469cf5a6209SStefano Zampini   if (!pcbddc->adaptive_selection) {
54709162d606SStefano Zampini     IS           ISForVertices,*ISForFaces,*ISForEdges;
5471cf5a6209SStefano Zampini     MatNullSpace nearnullsp;
5472cf5a6209SStefano Zampini     const Vec    *nearnullvecs;
5473cf5a6209SStefano Zampini     Vec          *localnearnullsp;
5474cf5a6209SStefano Zampini     PetscScalar  *array;
5475cf5a6209SStefano Zampini     PetscInt     n_ISForFaces,n_ISForEdges,nnsp_size;
5476cf5a6209SStefano Zampini     PetscBool    nnsp_has_cnst;
5477674ae819SStefano Zampini     /* LAPACK working arrays for SVD or POD */
5478b3d85658SStefano Zampini     PetscBool    skip_lapack,boolforchange;
5479674ae819SStefano Zampini     PetscScalar  *work;
5480674ae819SStefano Zampini     PetscReal    *singular_vals;
5481674ae819SStefano Zampini #if defined(PETSC_USE_COMPLEX)
5482674ae819SStefano Zampini     PetscReal    *rwork;
5483674ae819SStefano Zampini #endif
5484674ae819SStefano Zampini #if defined(PETSC_MISSING_LAPACK_GESVD)
5485674ae819SStefano Zampini     PetscScalar  *temp_basis,*correlation_mat;
5486674ae819SStefano Zampini #else
5487964fefecSStefano Zampini     PetscBLASInt dummy_int=1;
5488964fefecSStefano Zampini     PetscScalar  dummy_scalar=1.;
5489674ae819SStefano Zampini #endif
5490674ae819SStefano Zampini 
5491674ae819SStefano Zampini     /* Get index sets for faces, edges and vertices from graph */
5492d06fc5fdSStefano Zampini     ierr = PCBDDCGraphGetCandidatesIS(pcbddc->mat_graph,&n_ISForFaces,&ISForFaces,&n_ISForEdges,&ISForEdges,&ISForVertices);CHKERRQ(ierr);
5493e4d548c7SStefano Zampini     /* print some info */
54945c643e28SStefano Zampini     if (pcbddc->dbg_flag && (!pcbddc->sub_schurs || pcbddc->sub_schurs_rebuild)) {
5495e4d548c7SStefano Zampini       PetscInt nv;
5496e4d548c7SStefano Zampini 
5497c8272957SStefano Zampini       ierr = PCBDDCGraphASCIIView(pcbddc->mat_graph,pcbddc->dbg_flag,pcbddc->dbg_viewer);CHKERRQ(ierr);
5498e4d548c7SStefano Zampini       ierr = ISGetSize(ISForVertices,&nv);CHKERRQ(ierr);
5499e4d548c7SStefano Zampini       ierr = PetscViewerASCIIPushSynchronized(pcbddc->dbg_viewer);CHKERRQ(ierr);
5500e4d548c7SStefano Zampini       ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"--------------------------------------------------------------\n");CHKERRQ(ierr);
5501e4d548c7SStefano Zampini       ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"Subdomain %04d got %02d local candidate vertices (%d)\n",PetscGlobalRank,nv,pcbddc->use_vertices);CHKERRQ(ierr);
5502e4d548c7SStefano Zampini       ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"Subdomain %04d got %02d local candidate edges    (%d)\n",PetscGlobalRank,n_ISForEdges,pcbddc->use_edges);CHKERRQ(ierr);
5503e4d548c7SStefano Zampini       ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"Subdomain %04d got %02d local candidate faces    (%d)\n",PetscGlobalRank,n_ISForFaces,pcbddc->use_faces);CHKERRQ(ierr);
5504e4d548c7SStefano Zampini       ierr = PetscViewerFlush(pcbddc->dbg_viewer);CHKERRQ(ierr);
5505e4d548c7SStefano Zampini       ierr = PetscViewerASCIIPopSynchronized(pcbddc->dbg_viewer);CHKERRQ(ierr);
5506e4d548c7SStefano Zampini     }
5507e4d548c7SStefano Zampini 
5508d06fc5fdSStefano Zampini     /* free unneeded index sets */
5509d06fc5fdSStefano Zampini     if (!pcbddc->use_vertices) {
5510d06fc5fdSStefano Zampini       ierr = ISDestroy(&ISForVertices);CHKERRQ(ierr);
5511674ae819SStefano Zampini     }
5512d06fc5fdSStefano Zampini     if (!pcbddc->use_edges) {
5513d06fc5fdSStefano Zampini       for (i=0;i<n_ISForEdges;i++) {
5514d06fc5fdSStefano Zampini         ierr = ISDestroy(&ISForEdges[i]);CHKERRQ(ierr);
5515d06fc5fdSStefano Zampini       }
5516d06fc5fdSStefano Zampini       ierr = PetscFree(ISForEdges);CHKERRQ(ierr);
5517d06fc5fdSStefano Zampini       n_ISForEdges = 0;
5518d06fc5fdSStefano Zampini     }
5519d06fc5fdSStefano Zampini     if (!pcbddc->use_faces) {
5520d06fc5fdSStefano Zampini       for (i=0;i<n_ISForFaces;i++) {
5521d06fc5fdSStefano Zampini         ierr = ISDestroy(&ISForFaces[i]);CHKERRQ(ierr);
5522d06fc5fdSStefano Zampini       }
5523d06fc5fdSStefano Zampini       ierr = PetscFree(ISForFaces);CHKERRQ(ierr);
5524d06fc5fdSStefano Zampini       n_ISForFaces = 0;
5525d06fc5fdSStefano Zampini     }
552670022509SStefano Zampini 
5527674ae819SStefano Zampini     /* check if near null space is attached to global mat */
5528674ae819SStefano Zampini     ierr = MatGetNearNullSpace(pc->pmat,&nearnullsp);CHKERRQ(ierr);
5529674ae819SStefano Zampini     if (nearnullsp) {
5530674ae819SStefano Zampini       ierr = MatNullSpaceGetVecs(nearnullsp,&nnsp_has_cnst,&nnsp_size,&nearnullvecs);CHKERRQ(ierr);
5531f4ddd8eeSStefano Zampini       /* remove any stored info */
5532f4ddd8eeSStefano Zampini       ierr = MatNullSpaceDestroy(&pcbddc->onearnullspace);CHKERRQ(ierr);
5533f4ddd8eeSStefano Zampini       ierr = PetscFree(pcbddc->onearnullvecs_state);CHKERRQ(ierr);
5534f4ddd8eeSStefano Zampini       /* store information for BDDC solver reuse */
5535f4ddd8eeSStefano Zampini       ierr = PetscObjectReference((PetscObject)nearnullsp);CHKERRQ(ierr);
5536f4ddd8eeSStefano Zampini       pcbddc->onearnullspace = nearnullsp;
5537473ba861SJed Brown       ierr = PetscMalloc1(nnsp_size,&pcbddc->onearnullvecs_state);CHKERRQ(ierr);
5538f4ddd8eeSStefano Zampini       for (i=0;i<nnsp_size;i++) {
5539f4ddd8eeSStefano Zampini         ierr = PetscObjectStateGet((PetscObject)nearnullvecs[i],&pcbddc->onearnullvecs_state[i]);CHKERRQ(ierr);
5540f4ddd8eeSStefano Zampini       }
5541984c4197SStefano Zampini     } else { /* if near null space is not provided BDDC uses constants by default */
5542984c4197SStefano Zampini       nnsp_size = 0;
5543674ae819SStefano Zampini       nnsp_has_cnst = PETSC_TRUE;
5544674ae819SStefano Zampini     }
5545984c4197SStefano Zampini     /* get max number of constraints on a single cc */
5546984c4197SStefano Zampini     max_constraints = nnsp_size;
5547984c4197SStefano Zampini     if (nnsp_has_cnst) max_constraints++;
5548984c4197SStefano Zampini 
5549674ae819SStefano Zampini     /*
5550674ae819SStefano Zampini          Evaluate maximum storage size needed by the procedure
55519162d606SStefano Zampini          - Indices for connected component i stored at "constraints_idxs + constraints_idxs_ptr[i]"
55529162d606SStefano Zampini          - Values for constraints on connected component i stored at "constraints_data + constraints_data_ptr[i]"
55539162d606SStefano Zampini          There can be multiple constraints per connected component
5554674ae819SStefano Zampini                                                                                                                                                            */
5555674ae819SStefano Zampini     n_vertices = 0;
5556674ae819SStefano Zampini     if (ISForVertices) {
5557674ae819SStefano Zampini       ierr = ISGetSize(ISForVertices,&n_vertices);CHKERRQ(ierr);
5558674ae819SStefano Zampini     }
55599162d606SStefano Zampini     ncc = n_vertices+n_ISForFaces+n_ISForEdges;
55609162d606SStefano Zampini     ierr = PetscMalloc3(ncc+1,&constraints_idxs_ptr,ncc+1,&constraints_data_ptr,ncc,&constraints_n);CHKERRQ(ierr);
55619162d606SStefano Zampini 
55629162d606SStefano Zampini     total_counts = n_ISForFaces+n_ISForEdges;
55639162d606SStefano Zampini     total_counts *= max_constraints;
5564674ae819SStefano Zampini     total_counts += n_vertices;
55654641a718SStefano Zampini     ierr = PetscBTCreate(total_counts,&change_basis);CHKERRQ(ierr);
55669162d606SStefano Zampini 
5567674ae819SStefano Zampini     total_counts = 0;
5568674ae819SStefano Zampini     max_size_of_constraint = 0;
5569674ae819SStefano Zampini     for (i=0;i<n_ISForEdges+n_ISForFaces;i++) {
55709162d606SStefano Zampini       IS used_is;
5571674ae819SStefano Zampini       if (i<n_ISForEdges) {
55729162d606SStefano Zampini         used_is = ISForEdges[i];
5573674ae819SStefano Zampini       } else {
55749162d606SStefano Zampini         used_is = ISForFaces[i-n_ISForEdges];
5575674ae819SStefano Zampini       }
55769162d606SStefano Zampini       ierr = ISGetSize(used_is,&j);CHKERRQ(ierr);
5577674ae819SStefano Zampini       total_counts += j;
5578674ae819SStefano Zampini       max_size_of_constraint = PetscMax(j,max_size_of_constraint);
5579674ae819SStefano Zampini     }
55809162d606SStefano Zampini     ierr = PetscMalloc3(total_counts*max_constraints+n_vertices,&constraints_data,total_counts+n_vertices,&constraints_idxs,total_counts+n_vertices,&constraints_idxs_B);CHKERRQ(ierr);
55819162d606SStefano Zampini 
5582984c4197SStefano Zampini     /* get local part of global near null space vectors */
5583785e854fSJed Brown     ierr = PetscMalloc1(nnsp_size,&localnearnullsp);CHKERRQ(ierr);
5584984c4197SStefano Zampini     for (k=0;k<nnsp_size;k++) {
5585984c4197SStefano Zampini       ierr = VecDuplicate(pcis->vec1_N,&localnearnullsp[k]);CHKERRQ(ierr);
5586e176bc59SStefano Zampini       ierr = VecScatterBegin(matis->rctx,nearnullvecs[k],localnearnullsp[k],INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
5587e176bc59SStefano Zampini       ierr = VecScatterEnd(matis->rctx,nearnullvecs[k],localnearnullsp[k],INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
5588984c4197SStefano Zampini     }
5589674ae819SStefano Zampini 
5590242a89d7SStefano Zampini     /* whether or not to skip lapack calls */
5591242a89d7SStefano Zampini     skip_lapack = PETSC_TRUE;
5592a773dcb8SStefano Zampini     if (n_ISForFaces+n_ISForEdges && max_constraints > 1 && !pcbddc->use_nnsp_true) skip_lapack = PETSC_FALSE;
5593242a89d7SStefano Zampini 
5594984c4197SStefano Zampini     /* First we issue queries to allocate optimal workspace for LAPACKgesvd (or LAPACKsyev if SVD is missing) */
5595a773dcb8SStefano Zampini     if (!skip_lapack) {
5596674ae819SStefano Zampini       PetscScalar temp_work;
5597911cabfeSStefano Zampini 
5598674ae819SStefano Zampini #if defined(PETSC_MISSING_LAPACK_GESVD)
5599984c4197SStefano Zampini       /* Proper Orthogonal Decomposition (POD) using the snapshot method */
5600785e854fSJed Brown       ierr = PetscMalloc1(max_constraints*max_constraints,&correlation_mat);CHKERRQ(ierr);
5601785e854fSJed Brown       ierr = PetscMalloc1(max_constraints,&singular_vals);CHKERRQ(ierr);
5602785e854fSJed Brown       ierr = PetscMalloc1(max_size_of_constraint*max_constraints,&temp_basis);CHKERRQ(ierr);
5603674ae819SStefano Zampini #if defined(PETSC_USE_COMPLEX)
5604785e854fSJed Brown       ierr = PetscMalloc1(3*max_constraints,&rwork);CHKERRQ(ierr);
5605674ae819SStefano Zampini #endif
5606674ae819SStefano Zampini       /* now we evaluate the optimal workspace using query with lwork=-1 */
5607c8244a33SStefano Zampini       ierr = PetscBLASIntCast(max_constraints,&Blas_N);CHKERRQ(ierr);
5608c8244a33SStefano Zampini       ierr = PetscBLASIntCast(max_constraints,&Blas_LDA);CHKERRQ(ierr);
5609674ae819SStefano Zampini       lwork = -1;
5610674ae819SStefano Zampini       ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr);
5611674ae819SStefano Zampini #if !defined(PETSC_USE_COMPLEX)
5612c8244a33SStefano Zampini       PetscStackCallBLAS("LAPACKsyev",LAPACKsyev_("V","U",&Blas_N,correlation_mat,&Blas_LDA,singular_vals,&temp_work,&lwork,&lierr));
5613674ae819SStefano Zampini #else
5614c8244a33SStefano Zampini       PetscStackCallBLAS("LAPACKsyev",LAPACKsyev_("V","U",&Blas_N,correlation_mat,&Blas_LDA,singular_vals,&temp_work,&lwork,rwork,&lierr));
5615674ae819SStefano Zampini #endif
5616674ae819SStefano Zampini       ierr = PetscFPTrapPop();CHKERRQ(ierr);
5617984c4197SStefano Zampini       if (lierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in query to SYEV Lapack routine %d",(int)lierr);
5618674ae819SStefano Zampini #else /* on missing GESVD */
5619674ae819SStefano Zampini       /* SVD */
5620674ae819SStefano Zampini       PetscInt max_n,min_n;
5621674ae819SStefano Zampini       max_n = max_size_of_constraint;
5622984c4197SStefano Zampini       min_n = max_constraints;
5623984c4197SStefano Zampini       if (max_size_of_constraint < max_constraints) {
5624674ae819SStefano Zampini         min_n = max_size_of_constraint;
5625984c4197SStefano Zampini         max_n = max_constraints;
5626674ae819SStefano Zampini       }
5627785e854fSJed Brown       ierr = PetscMalloc1(min_n,&singular_vals);CHKERRQ(ierr);
5628674ae819SStefano Zampini #if defined(PETSC_USE_COMPLEX)
5629785e854fSJed Brown       ierr = PetscMalloc1(5*min_n,&rwork);CHKERRQ(ierr);
5630674ae819SStefano Zampini #endif
5631674ae819SStefano Zampini       /* now we evaluate the optimal workspace using query with lwork=-1 */
5632674ae819SStefano Zampini       lwork = -1;
5633e310c8b4SStefano Zampini       ierr = PetscBLASIntCast(max_n,&Blas_M);CHKERRQ(ierr);
5634e310c8b4SStefano Zampini       ierr = PetscBLASIntCast(min_n,&Blas_N);CHKERRQ(ierr);
5635b7d8b9f8SStefano Zampini       ierr = PetscBLASIntCast(max_n,&Blas_LDA);CHKERRQ(ierr);
5636674ae819SStefano Zampini       ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr);
5637674ae819SStefano Zampini #if !defined(PETSC_USE_COMPLEX)
56389162d606SStefano Zampini       PetscStackCallBLAS("LAPACKgesvd",LAPACKgesvd_("O","N",&Blas_M,&Blas_N,&constraints_data[0],&Blas_LDA,singular_vals,&dummy_scalar,&dummy_int,&dummy_scalar,&dummy_int,&temp_work,&lwork,&lierr));
5639674ae819SStefano Zampini #else
56409162d606SStefano Zampini       PetscStackCallBLAS("LAPACKgesvd",LAPACKgesvd_("O","N",&Blas_M,&Blas_N,&constraints_data[0],&Blas_LDA,singular_vals,&dummy_scalar,&dummy_int,&dummy_scalar,&dummy_int,&temp_work,&lwork,rwork,&lierr));
5641674ae819SStefano Zampini #endif
5642674ae819SStefano Zampini       ierr = PetscFPTrapPop();CHKERRQ(ierr);
5643984c4197SStefano Zampini       if (lierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in query to GESVD Lapack routine %d",(int)lierr);
5644984c4197SStefano Zampini #endif /* on missing GESVD */
5645674ae819SStefano Zampini       /* Allocate optimal workspace */
5646674ae819SStefano Zampini       ierr = PetscBLASIntCast((PetscInt)PetscRealPart(temp_work),&lwork);CHKERRQ(ierr);
5647854ce69bSBarry Smith       ierr = PetscMalloc1(lwork,&work);CHKERRQ(ierr);
5648674ae819SStefano Zampini     }
5649674ae819SStefano Zampini     /* Now we can loop on constraining sets */
5650674ae819SStefano Zampini     total_counts = 0;
56519162d606SStefano Zampini     constraints_idxs_ptr[0] = 0;
56529162d606SStefano Zampini     constraints_data_ptr[0] = 0;
5653674ae819SStefano Zampini     /* vertices */
56549162d606SStefano Zampini     if (n_vertices) {
5655674ae819SStefano Zampini       ierr = ISGetIndices(ISForVertices,(const PetscInt**)&is_indices);CHKERRQ(ierr);
56569162d606SStefano Zampini       ierr = PetscMemcpy(constraints_idxs,is_indices,n_vertices*sizeof(PetscInt));CHKERRQ(ierr);
5657674ae819SStefano Zampini       for (i=0;i<n_vertices;i++) {
56589162d606SStefano Zampini         constraints_n[total_counts] = 1;
56599162d606SStefano Zampini         constraints_data[total_counts] = 1.0;
56609162d606SStefano Zampini         constraints_idxs_ptr[total_counts+1] = constraints_idxs_ptr[total_counts]+1;
56619162d606SStefano Zampini         constraints_data_ptr[total_counts+1] = constraints_data_ptr[total_counts]+1;
5662674ae819SStefano Zampini         total_counts++;
5663674ae819SStefano Zampini       }
5664674ae819SStefano Zampini       ierr = ISRestoreIndices(ISForVertices,(const PetscInt**)&is_indices);CHKERRQ(ierr);
5665674ae819SStefano Zampini       n_vertices = total_counts;
5666674ae819SStefano Zampini     }
5667984c4197SStefano Zampini 
5668674ae819SStefano Zampini     /* edges and faces */
56699162d606SStefano Zampini     total_counts_cc = total_counts;
5670911cabfeSStefano Zampini     for (ncc=0;ncc<n_ISForEdges+n_ISForFaces;ncc++) {
56719162d606SStefano Zampini       IS        used_is;
56729162d606SStefano Zampini       PetscBool idxs_copied = PETSC_FALSE;
56739162d606SStefano Zampini 
5674911cabfeSStefano Zampini       if (ncc<n_ISForEdges) {
56759162d606SStefano Zampini         used_is = ISForEdges[ncc];
5676984c4197SStefano Zampini         boolforchange = pcbddc->use_change_of_basis; /* change or not the basis on the edge */
5677674ae819SStefano Zampini       } else {
56789162d606SStefano Zampini         used_is = ISForFaces[ncc-n_ISForEdges];
5679984c4197SStefano Zampini         boolforchange = (PetscBool)(pcbddc->use_change_of_basis && pcbddc->use_change_on_faces); /* change or not the basis on the face */
5680674ae819SStefano Zampini       }
5681674ae819SStefano Zampini       temp_constraints = 0;          /* zero the number of constraints I have on this conn comp */
56829162d606SStefano Zampini 
56839162d606SStefano Zampini       ierr = ISGetSize(used_is,&size_of_constraint);CHKERRQ(ierr);
56849162d606SStefano Zampini       ierr = ISGetIndices(used_is,(const PetscInt**)&is_indices);CHKERRQ(ierr);
5685984c4197SStefano Zampini       /* change of basis should not be performed on local periodic nodes */
5686984c4197SStefano Zampini       if (pcbddc->mat_graph->mirrors && pcbddc->mat_graph->mirrors[is_indices[0]]) boolforchange = PETSC_FALSE;
5687674ae819SStefano Zampini       if (nnsp_has_cnst) {
56885b08dc53SStefano Zampini         PetscScalar quad_value;
56899162d606SStefano Zampini 
56909162d606SStefano Zampini         ierr = PetscMemcpy(constraints_idxs + constraints_idxs_ptr[total_counts_cc],is_indices,size_of_constraint*sizeof(PetscInt));CHKERRQ(ierr);
56919162d606SStefano Zampini         idxs_copied = PETSC_TRUE;
56929162d606SStefano Zampini 
5693a773dcb8SStefano Zampini         if (!pcbddc->use_nnsp_true) {
5694674ae819SStefano Zampini           quad_value = (PetscScalar)(1.0/PetscSqrtReal((PetscReal)size_of_constraint));
5695a773dcb8SStefano Zampini         } else {
5696a773dcb8SStefano Zampini           quad_value = 1.0;
5697a773dcb8SStefano Zampini         }
5698674ae819SStefano Zampini         for (j=0;j<size_of_constraint;j++) {
56999162d606SStefano Zampini           constraints_data[constraints_data_ptr[total_counts_cc]+j] = quad_value;
5700674ae819SStefano Zampini         }
57019162d606SStefano Zampini         temp_constraints++;
5702674ae819SStefano Zampini         total_counts++;
5703674ae819SStefano Zampini       }
5704674ae819SStefano Zampini       for (k=0;k<nnsp_size;k++) {
5705984c4197SStefano Zampini         PetscReal real_value;
57069162d606SStefano Zampini         PetscScalar *ptr_to_data;
57079162d606SStefano Zampini 
5708984c4197SStefano Zampini         ierr = VecGetArrayRead(localnearnullsp[k],(const PetscScalar**)&array);CHKERRQ(ierr);
57099162d606SStefano Zampini         ptr_to_data = &constraints_data[constraints_data_ptr[total_counts_cc]+temp_constraints*size_of_constraint];
5710674ae819SStefano Zampini         for (j=0;j<size_of_constraint;j++) {
57119162d606SStefano Zampini           ptr_to_data[j] = array[is_indices[j]];
5712674ae819SStefano Zampini         }
5713984c4197SStefano Zampini         ierr = VecRestoreArrayRead(localnearnullsp[k],(const PetscScalar**)&array);CHKERRQ(ierr);
5714984c4197SStefano Zampini         /* check if array is null on the connected component */
5715e310c8b4SStefano Zampini         ierr = PetscBLASIntCast(size_of_constraint,&Blas_N);CHKERRQ(ierr);
57169162d606SStefano Zampini         PetscStackCallBLAS("BLASasum",real_value = BLASasum_(&Blas_N,ptr_to_data,&Blas_one));
57175b08dc53SStefano Zampini         if (real_value > 0.0) { /* keep indices and values */
5718674ae819SStefano Zampini           temp_constraints++;
5719674ae819SStefano Zampini           total_counts++;
57209162d606SStefano Zampini           if (!idxs_copied) {
57219162d606SStefano Zampini             ierr = PetscMemcpy(constraints_idxs + constraints_idxs_ptr[total_counts_cc],is_indices,size_of_constraint*sizeof(PetscInt));CHKERRQ(ierr);
57229162d606SStefano Zampini             idxs_copied = PETSC_TRUE;
5723674ae819SStefano Zampini           }
5724674ae819SStefano Zampini         }
57259162d606SStefano Zampini       }
57269162d606SStefano Zampini       ierr = ISRestoreIndices(used_is,(const PetscInt**)&is_indices);CHKERRQ(ierr);
572745a1bb75SStefano Zampini       valid_constraints = temp_constraints;
5728eb97c9d2SStefano Zampini       if (!pcbddc->use_nnsp_true && temp_constraints) {
5729a773dcb8SStefano Zampini         if (temp_constraints == 1) { /* just normalize the constraint */
57309162d606SStefano Zampini           PetscScalar norm,*ptr_to_data;
57319162d606SStefano Zampini 
57329162d606SStefano Zampini           ptr_to_data = &constraints_data[constraints_data_ptr[total_counts_cc]];
5733a773dcb8SStefano Zampini           ierr = PetscBLASIntCast(size_of_constraint,&Blas_N);CHKERRQ(ierr);
57349162d606SStefano Zampini           PetscStackCallBLAS("BLASdot",norm = BLASdot_(&Blas_N,ptr_to_data,&Blas_one,ptr_to_data,&Blas_one));
5735a773dcb8SStefano Zampini           norm = 1.0/PetscSqrtReal(PetscRealPart(norm));
57369162d606SStefano Zampini           PetscStackCallBLAS("BLASscal",BLASscal_(&Blas_N,&norm,ptr_to_data,&Blas_one));
5737a773dcb8SStefano Zampini         } else { /* perform SVD */
5738984c4197SStefano Zampini           PetscReal   tol = 1.0e-8; /* tolerance for retaining eigenmodes */
57399162d606SStefano Zampini           PetscScalar *ptr_to_data = &constraints_data[constraints_data_ptr[total_counts_cc]];
5740674ae819SStefano Zampini 
5741674ae819SStefano Zampini #if defined(PETSC_MISSING_LAPACK_GESVD)
5742984c4197SStefano Zampini           /* SVD: Y = U*S*V^H                -> U (eigenvectors of Y*Y^H) = Y*V*(S)^\dag
5743984c4197SStefano Zampini              POD: Y^H*Y = V*D*V^H, D = S^H*S -> U = Y*V*D^(-1/2)
5744984c4197SStefano Zampini              -> When PETSC_USE_COMPLEX and PETSC_MISSING_LAPACK_GESVD are defined
5745984c4197SStefano Zampini                 the constraints basis will differ (by a complex factor with absolute value equal to 1)
5746984c4197SStefano Zampini                 from that computed using LAPACKgesvd
5747984c4197SStefano Zampini              -> This is due to a different computation of eigenvectors in LAPACKheev
5748984c4197SStefano Zampini              -> The quality of the POD-computed basis will be the same */
5749984c4197SStefano Zampini           ierr = PetscMemzero(correlation_mat,temp_constraints*temp_constraints*sizeof(PetscScalar));CHKERRQ(ierr);
5750674ae819SStefano Zampini           /* Store upper triangular part of correlation matrix */
5751e310c8b4SStefano Zampini           ierr = PetscBLASIntCast(size_of_constraint,&Blas_N);CHKERRQ(ierr);
5752984c4197SStefano Zampini           ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr);
5753674ae819SStefano Zampini           for (j=0;j<temp_constraints;j++) {
5754674ae819SStefano Zampini             for (k=0;k<j+1;k++) {
57559162d606SStefano Zampini               PetscStackCallBLAS("BLASdot",correlation_mat[j*temp_constraints+k] = BLASdot_(&Blas_N,ptr_to_data+k*size_of_constraint,&Blas_one,ptr_to_data+j*size_of_constraint,&Blas_one));
5756674ae819SStefano Zampini             }
5757674ae819SStefano Zampini           }
5758e310c8b4SStefano Zampini           /* compute eigenvalues and eigenvectors of correlation matrix */
5759e310c8b4SStefano Zampini           ierr = PetscBLASIntCast(temp_constraints,&Blas_N);CHKERRQ(ierr);
5760e310c8b4SStefano Zampini           ierr = PetscBLASIntCast(temp_constraints,&Blas_LDA);CHKERRQ(ierr);
5761674ae819SStefano Zampini #if !defined(PETSC_USE_COMPLEX)
5762c8244a33SStefano Zampini           PetscStackCallBLAS("LAPACKsyev",LAPACKsyev_("V","U",&Blas_N,correlation_mat,&Blas_LDA,singular_vals,work,&lwork,&lierr));
5763674ae819SStefano Zampini #else
5764c8244a33SStefano Zampini           PetscStackCallBLAS("LAPACKsyev",LAPACKsyev_("V","U",&Blas_N,correlation_mat,&Blas_LDA,singular_vals,work,&lwork,rwork,&lierr));
5765674ae819SStefano Zampini #endif
5766674ae819SStefano Zampini           ierr = PetscFPTrapPop();CHKERRQ(ierr);
5767984c4197SStefano Zampini           if (lierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in SYEV Lapack routine %d",(int)lierr);
5768984c4197SStefano Zampini           /* retain eigenvalues greater than tol: note that LAPACKsyev gives eigs in ascending order */
5769674ae819SStefano Zampini           j = 0;
5770984c4197SStefano Zampini           while (j < temp_constraints && singular_vals[j] < tol) j++;
5771674ae819SStefano Zampini           total_counts = total_counts-j;
577245a1bb75SStefano Zampini           valid_constraints = temp_constraints-j;
5773e310c8b4SStefano Zampini           /* scale and copy POD basis into used quadrature memory */
5774c4303822SStefano Zampini           ierr = PetscBLASIntCast(size_of_constraint,&Blas_M);CHKERRQ(ierr);
5775c4303822SStefano Zampini           ierr = PetscBLASIntCast(temp_constraints,&Blas_N);CHKERRQ(ierr);
5776c4303822SStefano Zampini           ierr = PetscBLASIntCast(temp_constraints,&Blas_K);CHKERRQ(ierr);
5777c4303822SStefano Zampini           ierr = PetscBLASIntCast(size_of_constraint,&Blas_LDA);CHKERRQ(ierr);
5778c4303822SStefano Zampini           ierr = PetscBLASIntCast(temp_constraints,&Blas_LDB);CHKERRQ(ierr);
5779c4303822SStefano Zampini           ierr = PetscBLASIntCast(size_of_constraint,&Blas_LDC);CHKERRQ(ierr);
5780674ae819SStefano Zampini           if (j<temp_constraints) {
5781984c4197SStefano Zampini             PetscInt ii;
5782984c4197SStefano Zampini             for (k=j;k<temp_constraints;k++) singular_vals[k] = 1.0/PetscSqrtReal(singular_vals[k]);
5783674ae819SStefano Zampini             ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr);
57849162d606SStefano Zampini             PetscStackCallBLAS("BLASgemm",BLASgemm_("N","N",&Blas_M,&Blas_N,&Blas_K,&one,ptr_to_data,&Blas_LDA,correlation_mat,&Blas_LDB,&zero,temp_basis,&Blas_LDC));
5785674ae819SStefano Zampini             ierr = PetscFPTrapPop();CHKERRQ(ierr);
5786984c4197SStefano Zampini             for (k=0;k<temp_constraints-j;k++) {
5787674ae819SStefano Zampini               for (ii=0;ii<size_of_constraint;ii++) {
57889162d606SStefano Zampini                 ptr_to_data[k*size_of_constraint+ii] = singular_vals[temp_constraints-1-k]*temp_basis[(temp_constraints-1-k)*size_of_constraint+ii];
5789674ae819SStefano Zampini               }
5790674ae819SStefano Zampini             }
5791674ae819SStefano Zampini           }
5792674ae819SStefano Zampini #else  /* on missing GESVD */
5793e310c8b4SStefano Zampini           ierr = PetscBLASIntCast(size_of_constraint,&Blas_M);CHKERRQ(ierr);
5794e310c8b4SStefano Zampini           ierr = PetscBLASIntCast(temp_constraints,&Blas_N);CHKERRQ(ierr);
5795b7d8b9f8SStefano Zampini           ierr = PetscBLASIntCast(size_of_constraint,&Blas_LDA);CHKERRQ(ierr);
5796674ae819SStefano Zampini           ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr);
5797674ae819SStefano Zampini #if !defined(PETSC_USE_COMPLEX)
57989162d606SStefano Zampini           PetscStackCallBLAS("LAPACKgesvd",LAPACKgesvd_("O","N",&Blas_M,&Blas_N,ptr_to_data,&Blas_LDA,singular_vals,&dummy_scalar,&dummy_int,&dummy_scalar,&dummy_int,work,&lwork,&lierr));
5799674ae819SStefano Zampini #else
58009162d606SStefano Zampini           PetscStackCallBLAS("LAPACKgesvd",LAPACKgesvd_("O","N",&Blas_M,&Blas_N,ptr_to_data,&Blas_LDA,singular_vals,&dummy_scalar,&dummy_int,&dummy_scalar,&dummy_int,work,&lwork,rwork,&lierr));
5801674ae819SStefano Zampini #endif
5802984c4197SStefano Zampini           if (lierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in GESVD Lapack routine %d",(int)lierr);
5803674ae819SStefano Zampini           ierr = PetscFPTrapPop();CHKERRQ(ierr);
5804984c4197SStefano Zampini           /* retain eigenvalues greater than tol: note that LAPACKgesvd gives eigs in descending order */
5805e310c8b4SStefano Zampini           k = temp_constraints;
5806e310c8b4SStefano Zampini           if (k > size_of_constraint) k = size_of_constraint;
5807674ae819SStefano Zampini           j = 0;
5808e310c8b4SStefano Zampini           while (j < k && singular_vals[k-j-1] < tol) j++;
580945a1bb75SStefano Zampini           valid_constraints = k-j;
5810911cabfeSStefano Zampini           total_counts = total_counts-temp_constraints+valid_constraints;
5811984c4197SStefano Zampini #endif /* on missing GESVD */
5812674ae819SStefano Zampini         }
5813a773dcb8SStefano Zampini       }
58149162d606SStefano Zampini       /* update pointers information */
58159162d606SStefano Zampini       if (valid_constraints) {
58169162d606SStefano Zampini         constraints_n[total_counts_cc] = valid_constraints;
58179162d606SStefano Zampini         constraints_idxs_ptr[total_counts_cc+1] = constraints_idxs_ptr[total_counts_cc]+size_of_constraint;
58189162d606SStefano Zampini         constraints_data_ptr[total_counts_cc+1] = constraints_data_ptr[total_counts_cc]+size_of_constraint*valid_constraints;
58199162d606SStefano Zampini         /* set change_of_basis flag */
582045a1bb75SStefano Zampini         if (boolforchange) {
5821b3d85658SStefano Zampini           PetscBTSet(change_basis,total_counts_cc);
58229162d606SStefano Zampini         }
5823b3d85658SStefano Zampini         total_counts_cc++;
582445a1bb75SStefano Zampini       }
582545a1bb75SStefano Zampini     }
5826984c4197SStefano Zampini     /* free workspace */
58278f1c130eSStefano Zampini     if (!skip_lapack) {
5828984c4197SStefano Zampini       ierr = PetscFree(work);CHKERRQ(ierr);
5829984c4197SStefano Zampini #if defined(PETSC_USE_COMPLEX)
5830984c4197SStefano Zampini       ierr = PetscFree(rwork);CHKERRQ(ierr);
5831984c4197SStefano Zampini #endif
5832984c4197SStefano Zampini       ierr = PetscFree(singular_vals);CHKERRQ(ierr);
5833984c4197SStefano Zampini #if defined(PETSC_MISSING_LAPACK_GESVD)
5834984c4197SStefano Zampini       ierr = PetscFree(correlation_mat);CHKERRQ(ierr);
5835984c4197SStefano Zampini       ierr = PetscFree(temp_basis);CHKERRQ(ierr);
5836984c4197SStefano Zampini #endif
5837984c4197SStefano Zampini     }
5838984c4197SStefano Zampini     for (k=0;k<nnsp_size;k++) {
5839984c4197SStefano Zampini       ierr = VecDestroy(&localnearnullsp[k]);CHKERRQ(ierr);
5840984c4197SStefano Zampini     }
5841984c4197SStefano Zampini     ierr = PetscFree(localnearnullsp);CHKERRQ(ierr);
5842cf5a6209SStefano Zampini     /* free index sets of faces, edges and vertices */
5843cf5a6209SStefano Zampini     for (i=0;i<n_ISForFaces;i++) {
5844cf5a6209SStefano Zampini       ierr = ISDestroy(&ISForFaces[i]);CHKERRQ(ierr);
5845cf5a6209SStefano Zampini     }
5846cf5a6209SStefano Zampini     if (n_ISForFaces) {
5847cf5a6209SStefano Zampini       ierr = PetscFree(ISForFaces);CHKERRQ(ierr);
5848cf5a6209SStefano Zampini     }
5849cf5a6209SStefano Zampini     for (i=0;i<n_ISForEdges;i++) {
5850cf5a6209SStefano Zampini       ierr = ISDestroy(&ISForEdges[i]);CHKERRQ(ierr);
5851cf5a6209SStefano Zampini     }
5852cf5a6209SStefano Zampini     if (n_ISForEdges) {
5853cf5a6209SStefano Zampini       ierr = PetscFree(ISForEdges);CHKERRQ(ierr);
5854cf5a6209SStefano Zampini     }
5855cf5a6209SStefano Zampini     ierr = ISDestroy(&ISForVertices);CHKERRQ(ierr);
585608122e43SStefano Zampini   } else {
585708122e43SStefano Zampini     PCBDDCSubSchurs sub_schurs = pcbddc->sub_schurs;
5858984c4197SStefano Zampini 
585908122e43SStefano Zampini     total_counts = 0;
586008122e43SStefano Zampini     n_vertices = 0;
5861d62866d3SStefano Zampini     if (sub_schurs->is_vertices && pcbddc->use_vertices) {
5862d62866d3SStefano Zampini       ierr = ISGetLocalSize(sub_schurs->is_vertices,&n_vertices);CHKERRQ(ierr);
586308122e43SStefano Zampini     }
586408122e43SStefano Zampini     max_constraints = 0;
58659162d606SStefano Zampini     total_counts_cc = 0;
586608122e43SStefano Zampini     for (i=0;i<sub_schurs->n_subs+n_vertices;i++) {
586708122e43SStefano Zampini       total_counts += pcbddc->adaptive_constraints_n[i];
58689162d606SStefano Zampini       if (pcbddc->adaptive_constraints_n[i]) total_counts_cc++;
586908122e43SStefano Zampini       max_constraints = PetscMax(max_constraints,pcbddc->adaptive_constraints_n[i]);
587008122e43SStefano Zampini     }
58719162d606SStefano Zampini     constraints_idxs_ptr = pcbddc->adaptive_constraints_idxs_ptr;
58729162d606SStefano Zampini     constraints_data_ptr = pcbddc->adaptive_constraints_data_ptr;
58739162d606SStefano Zampini     constraints_idxs = pcbddc->adaptive_constraints_idxs;
58749162d606SStefano Zampini     constraints_data = pcbddc->adaptive_constraints_data;
587574d5cdf7SStefano Zampini     /* constraints_n differs from pcbddc->adaptive_constraints_n */
58769162d606SStefano Zampini     ierr = PetscMalloc1(total_counts_cc,&constraints_n);CHKERRQ(ierr);
58779162d606SStefano Zampini     total_counts_cc = 0;
58789162d606SStefano Zampini     for (i=0;i<sub_schurs->n_subs+n_vertices;i++) {
58799162d606SStefano Zampini       if (pcbddc->adaptive_constraints_n[i]) {
58809162d606SStefano Zampini         constraints_n[total_counts_cc++] = pcbddc->adaptive_constraints_n[i];
588108122e43SStefano Zampini       }
588208122e43SStefano Zampini     }
58839162d606SStefano Zampini #if 0
58849162d606SStefano Zampini     printf("Found %d totals (%d)\n",total_counts_cc,total_counts);
58859162d606SStefano Zampini     for (i=0;i<total_counts_cc;i++) {
58869162d606SStefano Zampini       printf("const %d, start %d",i,constraints_idxs_ptr[i]);
58879162d606SStefano Zampini       printf(" end %d:\n",constraints_idxs_ptr[i+1]);
58889162d606SStefano Zampini       for (j=constraints_idxs_ptr[i];j<constraints_idxs_ptr[i+1];j++) {
58899162d606SStefano Zampini         printf(" %d",constraints_idxs[j]);
58909162d606SStefano Zampini       }
58919162d606SStefano Zampini       printf("\n");
58929162d606SStefano Zampini       printf("number of cc: %d\n",constraints_n[i]);
58939162d606SStefano Zampini     }
58941b968477SStefano Zampini     for (i=0;i<n_vertices;i++) {
58958bec7fa6SStefano Zampini       PetscPrintf(PETSC_COMM_SELF,"[%d] vertex %d, n %d\n",PetscGlobalRank,i,pcbddc->adaptive_constraints_n[i]);
58961b968477SStefano Zampini     }
58971b968477SStefano Zampini     for (i=0;i<sub_schurs->n_subs;i++) {
58988bec7fa6SStefano Zampini       PetscPrintf(PETSC_COMM_SELF,"[%d] sub %d, edge %d, n %d\n",PetscGlobalRank,i,(PetscBool)PetscBTLookup(sub_schurs->is_edge,i),pcbddc->adaptive_constraints_n[i+n_vertices]);
58991b968477SStefano Zampini     }
590008122e43SStefano Zampini #endif
590108122e43SStefano Zampini 
59028bec7fa6SStefano Zampini     max_size_of_constraint = 0;
59039162d606SStefano Zampini     for (i=0;i<total_counts_cc;i++) max_size_of_constraint = PetscMax(max_size_of_constraint,constraints_idxs_ptr[i+1]-constraints_idxs_ptr[i]);
59049162d606SStefano Zampini     ierr = PetscMalloc1(constraints_idxs_ptr[total_counts_cc],&constraints_idxs_B);CHKERRQ(ierr);
590508122e43SStefano Zampini     /* Change of basis */
5906b3d85658SStefano Zampini     ierr = PetscBTCreate(total_counts_cc,&change_basis);CHKERRQ(ierr);
590708122e43SStefano Zampini     if (pcbddc->use_change_of_basis) {
590808122e43SStefano Zampini       for (i=0;i<sub_schurs->n_subs;i++) {
590908122e43SStefano Zampini         if (PetscBTLookup(sub_schurs->is_edge,i) || pcbddc->use_change_on_faces) {
5910b3d85658SStefano Zampini           ierr = PetscBTSet(change_basis,i+n_vertices);CHKERRQ(ierr);
591108122e43SStefano Zampini         }
591208122e43SStefano Zampini       }
591308122e43SStefano Zampini     }
591408122e43SStefano Zampini   }
5915984c4197SStefano Zampini   pcbddc->local_primal_size = total_counts;
59164f1b2e48SStefano Zampini   ierr = PetscMalloc1(pcbddc->local_primal_size+pcbddc->benign_n,&pcbddc->primal_indices_local_idxs);CHKERRQ(ierr);
591708122e43SStefano Zampini 
59189162d606SStefano Zampini   /* map constraints_idxs in boundary numbering */
59199162d606SStefano Zampini   ierr = ISGlobalToLocalMappingApply(pcis->BtoNmap,IS_GTOLM_DROP,constraints_idxs_ptr[total_counts_cc],constraints_idxs,&i,constraints_idxs_B);CHKERRQ(ierr);
5920eee23b56SStefano Zampini   if (i != constraints_idxs_ptr[total_counts_cc]) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Error in boundary numbering for constraints indices %D != %D\n",constraints_idxs_ptr[total_counts_cc],i);
5921674ae819SStefano Zampini 
5922674ae819SStefano Zampini   /* Create constraint matrix */
5923674ae819SStefano Zampini   ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->ConstraintMatrix);CHKERRQ(ierr);
592416f15bc4SStefano Zampini   ierr = MatSetType(pcbddc->ConstraintMatrix,MATAIJ);CHKERRQ(ierr);
5925984c4197SStefano Zampini   ierr = MatSetSizes(pcbddc->ConstraintMatrix,pcbddc->local_primal_size,pcis->n,pcbddc->local_primal_size,pcis->n);CHKERRQ(ierr);
5926984c4197SStefano Zampini 
5927984c4197SStefano Zampini   /* find primal_dofs: subdomain corners plus dofs selected as primal after change of basis */
5928a717540cSStefano Zampini   /* determine if a QR strategy is needed for change of basis */
5929a717540cSStefano Zampini   qr_needed = PETSC_FALSE;
593074d5cdf7SStefano Zampini   ierr = PetscBTCreate(total_counts_cc,&qr_needed_idx);CHKERRQ(ierr);
5931984c4197SStefano Zampini   total_primal_vertices=0;
5932b3d85658SStefano Zampini   pcbddc->local_primal_size_cc = 0;
59339162d606SStefano Zampini   for (i=0;i<total_counts_cc;i++) {
59349162d606SStefano Zampini     size_of_constraint = constraints_idxs_ptr[i+1]-constraints_idxs_ptr[i];
593572b8c272SStefano Zampini     if (size_of_constraint == 1 && pcbddc->mat_graph->custom_minimal_size) {
59369162d606SStefano Zampini       pcbddc->primal_indices_local_idxs[total_primal_vertices++] = constraints_idxs[constraints_idxs_ptr[i]];
5937b3d85658SStefano Zampini       pcbddc->local_primal_size_cc += 1;
593864efe560SStefano Zampini     } else if (PetscBTLookup(change_basis,i)) {
59399162d606SStefano Zampini       for (k=0;k<constraints_n[i];k++) {
59409162d606SStefano Zampini         pcbddc->primal_indices_local_idxs[total_primal_vertices++] = constraints_idxs[constraints_idxs_ptr[i]+k];
5941a717540cSStefano Zampini       }
5942b3d85658SStefano Zampini       pcbddc->local_primal_size_cc += constraints_n[i];
594391af6908SStefano Zampini       if (constraints_n[i] > 1 || pcbddc->use_qr_single) {
5944a717540cSStefano Zampini         PetscBTSet(qr_needed_idx,i);
5945a717540cSStefano Zampini         qr_needed = PETSC_TRUE;
5946a717540cSStefano Zampini       }
5947fa434743SStefano Zampini     } else {
5948b3d85658SStefano Zampini       pcbddc->local_primal_size_cc += 1;
5949fa434743SStefano Zampini     }
5950a717540cSStefano Zampini   }
5951b371cd4fSStefano Zampini   /* note that the local variable n_vertices used below stores the number of pointwise constraints */
5952b371cd4fSStefano Zampini   pcbddc->n_vertices = total_primal_vertices;
5953674ae819SStefano Zampini   /* permute indices in order to have a sorted set of vertices */
595470022509SStefano Zampini   ierr = PetscSortInt(total_primal_vertices,pcbddc->primal_indices_local_idxs);CHKERRQ(ierr);
59554f1b2e48SStefano Zampini   ierr = PetscMalloc2(pcbddc->local_primal_size_cc+pcbddc->benign_n,&pcbddc->local_primal_ref_node,pcbddc->local_primal_size_cc+pcbddc->benign_n,&pcbddc->local_primal_ref_mult);CHKERRQ(ierr);
59560e6343abSStefano Zampini   ierr = PetscMemcpy(pcbddc->local_primal_ref_node,pcbddc->primal_indices_local_idxs,total_primal_vertices*sizeof(PetscInt));CHKERRQ(ierr);
59570e6343abSStefano Zampini   for (i=0;i<total_primal_vertices;i++) pcbddc->local_primal_ref_mult[i] = 1;
5958984c4197SStefano Zampini 
5959984c4197SStefano Zampini   /* nonzero structure of constraint matrix */
596074d5cdf7SStefano Zampini   /* and get reference dof for local constraints */
5961785e854fSJed Brown   ierr = PetscMalloc1(pcbddc->local_primal_size,&nnz);CHKERRQ(ierr);
5962984c4197SStefano Zampini   for (i=0;i<total_primal_vertices;i++) nnz[i] = 1;
596374d5cdf7SStefano Zampini 
5964984c4197SStefano Zampini   j = total_primal_vertices;
596574d5cdf7SStefano Zampini   total_counts = total_primal_vertices;
5966b3d85658SStefano Zampini   cum = total_primal_vertices;
59679162d606SStefano Zampini   for (i=n_vertices;i<total_counts_cc;i++) {
59684641a718SStefano Zampini     if (!PetscBTLookup(change_basis,i)) {
5969b3d85658SStefano Zampini       pcbddc->local_primal_ref_node[cum] = constraints_idxs[constraints_idxs_ptr[i]];
5970b3d85658SStefano Zampini       pcbddc->local_primal_ref_mult[cum] = constraints_n[i];
5971b3d85658SStefano Zampini       cum++;
59729162d606SStefano Zampini       size_of_constraint = constraints_idxs_ptr[i+1]-constraints_idxs_ptr[i];
597374d5cdf7SStefano Zampini       for (k=0;k<constraints_n[i];k++) {
597474d5cdf7SStefano Zampini         pcbddc->primal_indices_local_idxs[total_counts++] = constraints_idxs[constraints_idxs_ptr[i]+k];
597574d5cdf7SStefano Zampini         nnz[j+k] = size_of_constraint;
597674d5cdf7SStefano Zampini       }
59779162d606SStefano Zampini       j += constraints_n[i];
5978674ae819SStefano Zampini     }
5979674ae819SStefano Zampini   }
5980674ae819SStefano Zampini   ierr = MatSeqAIJSetPreallocation(pcbddc->ConstraintMatrix,0,nnz);CHKERRQ(ierr);
5981674ae819SStefano Zampini   ierr = PetscFree(nnz);CHKERRQ(ierr);
5982088faed8SStefano Zampini 
5983674ae819SStefano Zampini   /* set values in constraint matrix */
5984984c4197SStefano Zampini   for (i=0;i<total_primal_vertices;i++) {
59850e6343abSStefano Zampini     ierr = MatSetValue(pcbddc->ConstraintMatrix,i,pcbddc->local_primal_ref_node[i],1.0,INSERT_VALUES);CHKERRQ(ierr);
5986674ae819SStefano Zampini   }
5987984c4197SStefano Zampini   total_counts = total_primal_vertices;
59889162d606SStefano Zampini   for (i=n_vertices;i<total_counts_cc;i++) {
59894641a718SStefano Zampini     if (!PetscBTLookup(change_basis,i)) {
59909162d606SStefano Zampini       PetscInt *cols;
59919162d606SStefano Zampini 
59929162d606SStefano Zampini       size_of_constraint = constraints_idxs_ptr[i+1]-constraints_idxs_ptr[i];
59939162d606SStefano Zampini       cols = constraints_idxs+constraints_idxs_ptr[i];
59949162d606SStefano Zampini       for (k=0;k<constraints_n[i];k++) {
59959162d606SStefano Zampini         PetscInt    row = total_counts+k;
59969162d606SStefano Zampini         PetscScalar *vals;
59979162d606SStefano Zampini 
59989162d606SStefano Zampini         vals = constraints_data+constraints_data_ptr[i]+k*size_of_constraint;
59999162d606SStefano Zampini         ierr = MatSetValues(pcbddc->ConstraintMatrix,1,&row,size_of_constraint,cols,vals,INSERT_VALUES);CHKERRQ(ierr);
60009162d606SStefano Zampini       }
60019162d606SStefano Zampini       total_counts += constraints_n[i];
6002674ae819SStefano Zampini     }
6003674ae819SStefano Zampini   }
6004674ae819SStefano Zampini   /* assembling */
6005674ae819SStefano Zampini   ierr = MatAssemblyBegin(pcbddc->ConstraintMatrix,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
6006674ae819SStefano Zampini   ierr = MatAssemblyEnd(pcbddc->ConstraintMatrix,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
6007088faed8SStefano Zampini 
6008984c4197SStefano Zampini   /*
60096a9046bcSBarry Smith   ierr = PetscViewerPushFormat(PETSC_VIEWER_STDOUT_SELF,PETSC_VIEWER_ASCII_MATLAB);CHKERRQ(ierr);
6010984c4197SStefano Zampini   ierr = MatView(pcbddc->ConstraintMatrix,(PetscViewer)0);CHKERRQ(ierr);
6011f159cad9SBarry Smith   ierr = PetscViewerPopFormat(PETSC_VIEWER_STDOUT_SELF);CHKERRQ(ierr);
6012984c4197SStefano Zampini   */
6013674ae819SStefano Zampini   /* Create matrix for change of basis. We don't need it in case pcbddc->use_change_of_basis is FALSE */
6014674ae819SStefano Zampini   if (pcbddc->use_change_of_basis) {
6015026de310SStefano Zampini     /* dual and primal dofs on a single cc */
6016984c4197SStefano Zampini     PetscInt     dual_dofs,primal_dofs;
6017984c4197SStefano Zampini     /* working stuff for GEQRF */
601881d9aea3SBarry Smith     PetscScalar  *qr_basis,*qr_tau = NULL,*qr_work,lqr_work_t;
6019984c4197SStefano Zampini     PetscBLASInt lqr_work;
6020984c4197SStefano Zampini     /* working stuff for UNGQR */
6021984c4197SStefano Zampini     PetscScalar  *gqr_work,lgqr_work_t;
6022984c4197SStefano Zampini     PetscBLASInt lgqr_work;
6023984c4197SStefano Zampini     /* working stuff for TRTRS */
6024984c4197SStefano Zampini     PetscScalar  *trs_rhs;
60253f08241aSStefano Zampini     PetscBLASInt Blas_NRHS;
6026984c4197SStefano Zampini     /* pointers for values insertion into change of basis matrix */
6027984c4197SStefano Zampini     PetscInt     *start_rows,*start_cols;
6028984c4197SStefano Zampini     PetscScalar  *start_vals;
6029984c4197SStefano Zampini     /* working stuff for values insertion */
60304641a718SStefano Zampini     PetscBT      is_primal;
603164efe560SStefano Zampini     PetscInt     *aux_primal_numbering_B;
6032906d46d4SStefano Zampini     /* matrix sizes */
6033906d46d4SStefano Zampini     PetscInt     global_size,local_size;
6034906d46d4SStefano Zampini     /* temporary change of basis */
6035906d46d4SStefano Zampini     Mat          localChangeOfBasisMatrix;
6036cf5a6209SStefano Zampini     /* extra space for debugging */
6037cf5a6209SStefano Zampini     PetscScalar  *dbg_work;
6038984c4197SStefano Zampini 
6039906d46d4SStefano Zampini     /* local temporary change of basis acts on local interfaces -> dimension is n_B x n_B */
6040906d46d4SStefano Zampini     ierr = MatCreate(PETSC_COMM_SELF,&localChangeOfBasisMatrix);CHKERRQ(ierr);
604116f15bc4SStefano Zampini     ierr = MatSetType(localChangeOfBasisMatrix,MATAIJ);CHKERRQ(ierr);
6042bbb9e6c6SStefano Zampini     ierr = MatSetSizes(localChangeOfBasisMatrix,pcis->n,pcis->n,pcis->n,pcis->n);CHKERRQ(ierr);
6043906d46d4SStefano Zampini     /* nonzeros for local mat */
6044bbb9e6c6SStefano Zampini     ierr = PetscMalloc1(pcis->n,&nnz);CHKERRQ(ierr);
60451dd7afcfSStefano Zampini     if (!pcbddc->benign_change || pcbddc->fake_change) {
6046bbb9e6c6SStefano Zampini       for (i=0;i<pcis->n;i++) nnz[i]=1;
60471dd7afcfSStefano Zampini     } else {
60481dd7afcfSStefano Zampini       const PetscInt *ii;
60491dd7afcfSStefano Zampini       PetscInt       n;
60501dd7afcfSStefano Zampini       PetscBool      flg_row;
60511dd7afcfSStefano Zampini       ierr = MatGetRowIJ(pcbddc->benign_change,0,PETSC_FALSE,PETSC_FALSE,&n,&ii,NULL,&flg_row);CHKERRQ(ierr);
60521dd7afcfSStefano Zampini       for (i=0;i<n;i++) nnz[i] = ii[i+1]-ii[i];
60531dd7afcfSStefano Zampini       ierr = MatRestoreRowIJ(pcbddc->benign_change,0,PETSC_FALSE,PETSC_FALSE,&n,&ii,NULL,&flg_row);CHKERRQ(ierr);
60541dd7afcfSStefano Zampini     }
60559162d606SStefano Zampini     for (i=n_vertices;i<total_counts_cc;i++) {
6056a717540cSStefano Zampini       if (PetscBTLookup(change_basis,i)) {
60579162d606SStefano Zampini         size_of_constraint = constraints_idxs_ptr[i+1]-constraints_idxs_ptr[i];
6058a717540cSStefano Zampini         if (PetscBTLookup(qr_needed_idx,i)) {
60599162d606SStefano Zampini           for (j=0;j<size_of_constraint;j++) nnz[constraints_idxs[constraints_idxs_ptr[i]+j]] = size_of_constraint;
6060a717540cSStefano Zampini         } else {
60619162d606SStefano Zampini           nnz[constraints_idxs[constraints_idxs_ptr[i]]] = size_of_constraint;
60629162d606SStefano Zampini           for (j=1;j<size_of_constraint;j++) nnz[constraints_idxs[constraints_idxs_ptr[i]+j]] = 2;
6063a717540cSStefano Zampini         }
6064a717540cSStefano Zampini       }
6065a717540cSStefano Zampini     }
6066906d46d4SStefano Zampini     ierr = MatSeqAIJSetPreallocation(localChangeOfBasisMatrix,0,nnz);CHKERRQ(ierr);
6067bbb9e6c6SStefano Zampini     ierr = PetscFree(nnz);CHKERRQ(ierr);
60681dd7afcfSStefano Zampini     /* Set interior change in the matrix */
60691dd7afcfSStefano Zampini     if (!pcbddc->benign_change || pcbddc->fake_change) {
6070bbb9e6c6SStefano Zampini       for (i=0;i<pcis->n;i++) {
6071906d46d4SStefano Zampini         ierr = MatSetValue(localChangeOfBasisMatrix,i,i,1.0,INSERT_VALUES);CHKERRQ(ierr);
6072a717540cSStefano Zampini       }
60731dd7afcfSStefano Zampini     } else {
60741dd7afcfSStefano Zampini       const PetscInt *ii,*jj;
60751dd7afcfSStefano Zampini       PetscScalar    *aa;
60761dd7afcfSStefano Zampini       PetscInt       n;
60771dd7afcfSStefano Zampini       PetscBool      flg_row;
60781dd7afcfSStefano Zampini       ierr = MatGetRowIJ(pcbddc->benign_change,0,PETSC_FALSE,PETSC_FALSE,&n,&ii,&jj,&flg_row);CHKERRQ(ierr);
60791dd7afcfSStefano Zampini       ierr = MatSeqAIJGetArray(pcbddc->benign_change,&aa);CHKERRQ(ierr);
60801dd7afcfSStefano Zampini       for (i=0;i<n;i++) {
60811dd7afcfSStefano Zampini         ierr = MatSetValues(localChangeOfBasisMatrix,1,&i,ii[i+1]-ii[i],jj+ii[i],aa+ii[i],INSERT_VALUES);CHKERRQ(ierr);
60821dd7afcfSStefano Zampini       }
60831dd7afcfSStefano Zampini       ierr = MatSeqAIJRestoreArray(pcbddc->benign_change,&aa);CHKERRQ(ierr);
60841dd7afcfSStefano Zampini       ierr = MatRestoreRowIJ(pcbddc->benign_change,0,PETSC_FALSE,PETSC_FALSE,&n,&ii,&jj,&flg_row);CHKERRQ(ierr);
60851dd7afcfSStefano Zampini     }
6086a717540cSStefano Zampini 
6087a717540cSStefano Zampini     if (pcbddc->dbg_flag) {
6088a717540cSStefano Zampini       ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"--------------------------------------------------------------\n");CHKERRQ(ierr);
6089a717540cSStefano Zampini       ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"Checking change of basis computation for subdomain %04d\n",PetscGlobalRank);CHKERRQ(ierr);
6090a717540cSStefano Zampini     }
6091a717540cSStefano Zampini 
6092a717540cSStefano Zampini 
6093a717540cSStefano Zampini     /* Now we loop on the constraints which need a change of basis */
6094a717540cSStefano Zampini     /*
6095a717540cSStefano Zampini        Change of basis matrix is evaluated similarly to the FIRST APPROACH in
6096a717540cSStefano Zampini        Klawonn and Widlund, Dual-primal FETI-DP methods for linear elasticity, (see Sect 6.2.1)
6097a717540cSStefano Zampini 
6098a6b551f4SStefano Zampini        Basic blocks of change of basis matrix T computed by
6099a717540cSStefano Zampini 
6100a6b551f4SStefano Zampini           - Using the following block transformation if there is a single primal dof on the cc (and -pc_bddc_use_qr_single is not specified)
6101a6b551f4SStefano Zampini 
6102a6b551f4SStefano Zampini             | 1        0   ...        0         s_1/S |
6103a6b551f4SStefano Zampini             | 0        1   ...        0         s_2/S |
6104a717540cSStefano Zampini             |              ...                        |
6105a6b551f4SStefano Zampini             | 0        ...            1     s_{n-1}/S |
6106a6b551f4SStefano Zampini             | -s_1/s_n ...    -s_{n-1}/s_n      s_n/S |
6107a717540cSStefano Zampini 
6108a6b551f4SStefano Zampini             with S = \sum_{i=1}^n s_i^2
6109a6b551f4SStefano Zampini             NOTE: in the above example, the primal dof is the last one of the edge in LOCAL ordering
6110a6b551f4SStefano Zampini                   in the current implementation, the primal dof is the first one of the edge in GLOBAL ordering
6111a6b551f4SStefano Zampini 
6112a6b551f4SStefano Zampini           - QR decomposition of constraints otherwise
6113a717540cSStefano Zampini     */
6114a717540cSStefano Zampini     if (qr_needed) {
6115984c4197SStefano Zampini       /* space to store Q */
6116854ce69bSBarry Smith       ierr = PetscMalloc1(max_size_of_constraint*max_size_of_constraint,&qr_basis);CHKERRQ(ierr);
61174e64d54eSstefano_zampini       /* array to store scaling factors for reflectors */
61184e64d54eSstefano_zampini       ierr = PetscMalloc1(max_constraints,&qr_tau);CHKERRQ(ierr);
6119984c4197SStefano Zampini       /* first we issue queries for optimal work */
61203f08241aSStefano Zampini       ierr = PetscBLASIntCast(max_size_of_constraint,&Blas_M);CHKERRQ(ierr);
61213f08241aSStefano Zampini       ierr = PetscBLASIntCast(max_constraints,&Blas_N);CHKERRQ(ierr);
61223f08241aSStefano Zampini       ierr = PetscBLASIntCast(max_size_of_constraint,&Blas_LDA);CHKERRQ(ierr);
6123984c4197SStefano Zampini       lqr_work = -1;
61243f08241aSStefano Zampini       PetscStackCallBLAS("LAPACKgeqrf",LAPACKgeqrf_(&Blas_M,&Blas_N,qr_basis,&Blas_LDA,qr_tau,&lqr_work_t,&lqr_work,&lierr));
6125984c4197SStefano Zampini       if (lierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in query to GEQRF Lapack routine %d",(int)lierr);
6126984c4197SStefano Zampini       ierr = PetscBLASIntCast((PetscInt)PetscRealPart(lqr_work_t),&lqr_work);CHKERRQ(ierr);
6127785e854fSJed Brown       ierr = PetscMalloc1((PetscInt)PetscRealPart(lqr_work_t),&qr_work);CHKERRQ(ierr);
6128984c4197SStefano Zampini       lgqr_work = -1;
61293f08241aSStefano Zampini       ierr = PetscBLASIntCast(max_size_of_constraint,&Blas_M);CHKERRQ(ierr);
61303f08241aSStefano Zampini       ierr = PetscBLASIntCast(max_size_of_constraint,&Blas_N);CHKERRQ(ierr);
61313f08241aSStefano Zampini       ierr = PetscBLASIntCast(max_constraints,&Blas_K);CHKERRQ(ierr);
61323f08241aSStefano Zampini       ierr = PetscBLASIntCast(max_size_of_constraint,&Blas_LDA);CHKERRQ(ierr);
61333f08241aSStefano Zampini       if (Blas_K>Blas_M) Blas_K=Blas_M; /* adjust just for computing optimal work */
6134*c964aadfSJose E. Roman       PetscStackCallBLAS("LAPACKorgqr",LAPACKorgqr_(&Blas_M,&Blas_N,&Blas_K,qr_basis,&Blas_LDA,qr_tau,&lgqr_work_t,&lgqr_work,&lierr));
6135*c964aadfSJose E. Roman       if (lierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in query to ORGQR/UNGQR Lapack routine %d",(int)lierr);
6136984c4197SStefano Zampini       ierr = PetscBLASIntCast((PetscInt)PetscRealPart(lgqr_work_t),&lgqr_work);CHKERRQ(ierr);
6137785e854fSJed Brown       ierr = PetscMalloc1((PetscInt)PetscRealPart(lgqr_work_t),&gqr_work);CHKERRQ(ierr);
6138984c4197SStefano Zampini       /* array to store rhs and solution of triangular solver */
6139785e854fSJed Brown       ierr = PetscMalloc1(max_constraints*max_constraints,&trs_rhs);CHKERRQ(ierr);
6140a717540cSStefano Zampini       /* allocating workspace for check */
6141a717540cSStefano Zampini       if (pcbddc->dbg_flag) {
6142cf5a6209SStefano Zampini         ierr = PetscMalloc1(max_size_of_constraint*(max_constraints+max_size_of_constraint),&dbg_work);CHKERRQ(ierr);
6143a717540cSStefano Zampini       }
6144a717540cSStefano Zampini     }
6145984c4197SStefano Zampini     /* array to store whether a node is primal or not */
61464641a718SStefano Zampini     ierr = PetscBTCreate(pcis->n_B,&is_primal);CHKERRQ(ierr);
6147473ba861SJed Brown     ierr = PetscMalloc1(total_primal_vertices,&aux_primal_numbering_B);CHKERRQ(ierr);
61480e6343abSStefano Zampini     ierr = ISGlobalToLocalMappingApply(pcis->BtoNmap,IS_GTOLM_DROP,total_primal_vertices,pcbddc->local_primal_ref_node,&i,aux_primal_numbering_B);CHKERRQ(ierr);
6149eee23b56SStefano Zampini     if (i != total_primal_vertices) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Error in boundary numbering for BDDC vertices! %D != %D\n",total_primal_vertices,i);
615039e2fb2aSStefano Zampini     for (i=0;i<total_primal_vertices;i++) {
615139e2fb2aSStefano Zampini       ierr = PetscBTSet(is_primal,aux_primal_numbering_B[i]);CHKERRQ(ierr);
615239e2fb2aSStefano Zampini     }
615339e2fb2aSStefano Zampini     ierr = PetscFree(aux_primal_numbering_B);CHKERRQ(ierr);
6154984c4197SStefano Zampini 
6155a717540cSStefano Zampini     /* loop on constraints and see whether or not they need a change of basis and compute it */
61569162d606SStefano Zampini     for (total_counts=n_vertices;total_counts<total_counts_cc;total_counts++) {
61579162d606SStefano Zampini       size_of_constraint = constraints_idxs_ptr[total_counts+1]-constraints_idxs_ptr[total_counts];
61584641a718SStefano Zampini       if (PetscBTLookup(change_basis,total_counts)) {
6159984c4197SStefano Zampini         /* get constraint info */
61609162d606SStefano Zampini         primal_dofs = constraints_n[total_counts];
6161984c4197SStefano Zampini         dual_dofs = size_of_constraint-primal_dofs;
6162984c4197SStefano Zampini 
6163984c4197SStefano Zampini         if (pcbddc->dbg_flag) {
61649162d606SStefano Zampini           ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"Constraints %d: %d need a change of basis (size %d)\n",total_counts,primal_dofs,size_of_constraint);CHKERRQ(ierr);
6165674ae819SStefano Zampini         }
6166984c4197SStefano Zampini 
6167fa434743SStefano Zampini         if (PetscBTLookup(qr_needed_idx,total_counts)) { /* QR */
6168a717540cSStefano Zampini 
6169a717540cSStefano Zampini           /* copy quadrature constraints for change of basis check */
6170a717540cSStefano Zampini           if (pcbddc->dbg_flag) {
61719162d606SStefano Zampini             ierr = PetscMemcpy(dbg_work,&constraints_data[constraints_data_ptr[total_counts]],size_of_constraint*primal_dofs*sizeof(PetscScalar));CHKERRQ(ierr);
6172a717540cSStefano Zampini           }
6173984c4197SStefano Zampini           /* copy temporary constraints into larger work vector (in order to store all columns of Q) */
61749162d606SStefano Zampini           ierr = PetscMemcpy(qr_basis,&constraints_data[constraints_data_ptr[total_counts]],size_of_constraint*primal_dofs*sizeof(PetscScalar));CHKERRQ(ierr);
6175984c4197SStefano Zampini 
6176984c4197SStefano Zampini           /* compute QR decomposition of constraints */
61773f08241aSStefano Zampini           ierr = PetscBLASIntCast(size_of_constraint,&Blas_M);CHKERRQ(ierr);
61783f08241aSStefano Zampini           ierr = PetscBLASIntCast(primal_dofs,&Blas_N);CHKERRQ(ierr);
61793f08241aSStefano Zampini           ierr = PetscBLASIntCast(size_of_constraint,&Blas_LDA);CHKERRQ(ierr);
6180674ae819SStefano Zampini           ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr);
61813f08241aSStefano Zampini           PetscStackCallBLAS("LAPACKgeqrf",LAPACKgeqrf_(&Blas_M,&Blas_N,qr_basis,&Blas_LDA,qr_tau,qr_work,&lqr_work,&lierr));
6182984c4197SStefano Zampini           if (lierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in GEQRF Lapack routine %d",(int)lierr);
6183674ae819SStefano Zampini           ierr = PetscFPTrapPop();CHKERRQ(ierr);
6184984c4197SStefano Zampini 
6185984c4197SStefano Zampini           /* explicitly compute R^-T */
6186984c4197SStefano Zampini           ierr = PetscMemzero(trs_rhs,primal_dofs*primal_dofs*sizeof(*trs_rhs));CHKERRQ(ierr);
6187984c4197SStefano Zampini           for (j=0;j<primal_dofs;j++) trs_rhs[j*(primal_dofs+1)] = 1.0;
61883f08241aSStefano Zampini           ierr = PetscBLASIntCast(primal_dofs,&Blas_N);CHKERRQ(ierr);
61893f08241aSStefano Zampini           ierr = PetscBLASIntCast(primal_dofs,&Blas_NRHS);CHKERRQ(ierr);
61903f08241aSStefano Zampini           ierr = PetscBLASIntCast(size_of_constraint,&Blas_LDA);CHKERRQ(ierr);
61913f08241aSStefano Zampini           ierr = PetscBLASIntCast(primal_dofs,&Blas_LDB);CHKERRQ(ierr);
6192984c4197SStefano Zampini           ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr);
61933f08241aSStefano Zampini           PetscStackCallBLAS("LAPACKtrtrs",LAPACKtrtrs_("U","T","N",&Blas_N,&Blas_NRHS,qr_basis,&Blas_LDA,trs_rhs,&Blas_LDB,&lierr));
6194984c4197SStefano Zampini           if (lierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in TRTRS Lapack routine %d",(int)lierr);
6195984c4197SStefano Zampini           ierr = PetscFPTrapPop();CHKERRQ(ierr);
6196984c4197SStefano Zampini 
6197a717540cSStefano Zampini           /* explicitly compute all columns of Q (Q = [Q1 | Q2] ) overwriting QR factorization in qr_basis */
61983f08241aSStefano Zampini           ierr = PetscBLASIntCast(size_of_constraint,&Blas_M);CHKERRQ(ierr);
61993f08241aSStefano Zampini           ierr = PetscBLASIntCast(size_of_constraint,&Blas_N);CHKERRQ(ierr);
62003f08241aSStefano Zampini           ierr = PetscBLASIntCast(primal_dofs,&Blas_K);CHKERRQ(ierr);
62013f08241aSStefano Zampini           ierr = PetscBLASIntCast(size_of_constraint,&Blas_LDA);CHKERRQ(ierr);
6202984c4197SStefano Zampini           ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr);
6203*c964aadfSJose E. Roman           PetscStackCallBLAS("LAPACKorgqr",LAPACKorgqr_(&Blas_M,&Blas_N,&Blas_K,qr_basis,&Blas_LDA,qr_tau,gqr_work,&lgqr_work,&lierr));
6204*c964aadfSJose E. Roman           if (lierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in ORGQR/UNGQR Lapack routine %d",(int)lierr);
6205984c4197SStefano Zampini           ierr = PetscFPTrapPop();CHKERRQ(ierr);
6206984c4197SStefano Zampini 
6207984c4197SStefano Zampini           /* first primal_dofs columns of Q need to be re-scaled in order to be unitary w.r.t constraints
6208984c4197SStefano Zampini              i.e. C_{pxn}*Q_{nxn} should be equal to [I_pxp | 0_pxd] (see check below)
6209984c4197SStefano Zampini              where n=size_of_constraint, p=primal_dofs, d=dual_dofs (n=p+d), I and 0 identity and null matrix resp. */
62103f08241aSStefano Zampini           ierr = PetscBLASIntCast(size_of_constraint,&Blas_M);CHKERRQ(ierr);
62113f08241aSStefano Zampini           ierr = PetscBLASIntCast(primal_dofs,&Blas_N);CHKERRQ(ierr);
62123f08241aSStefano Zampini           ierr = PetscBLASIntCast(primal_dofs,&Blas_K);CHKERRQ(ierr);
62133f08241aSStefano Zampini           ierr = PetscBLASIntCast(size_of_constraint,&Blas_LDA);CHKERRQ(ierr);
62143f08241aSStefano Zampini           ierr = PetscBLASIntCast(primal_dofs,&Blas_LDB);CHKERRQ(ierr);
62153f08241aSStefano Zampini           ierr = PetscBLASIntCast(size_of_constraint,&Blas_LDC);CHKERRQ(ierr);
6216984c4197SStefano Zampini           ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr);
62179162d606SStefano Zampini           PetscStackCallBLAS("BLASgemm",BLASgemm_("N","N",&Blas_M,&Blas_N,&Blas_K,&one,qr_basis,&Blas_LDA,trs_rhs,&Blas_LDB,&zero,constraints_data+constraints_data_ptr[total_counts],&Blas_LDC));
6218984c4197SStefano Zampini           ierr = PetscFPTrapPop();CHKERRQ(ierr);
62199162d606SStefano Zampini           ierr = PetscMemcpy(qr_basis,&constraints_data[constraints_data_ptr[total_counts]],size_of_constraint*primal_dofs*sizeof(PetscScalar));CHKERRQ(ierr);
6220984c4197SStefano Zampini 
6221984c4197SStefano Zampini           /* insert values in change of basis matrix respecting global ordering of new primal dofs */
62229162d606SStefano Zampini           start_rows = &constraints_idxs[constraints_idxs_ptr[total_counts]];
6223984c4197SStefano Zampini           /* insert cols for primal dofs */
6224984c4197SStefano Zampini           for (j=0;j<primal_dofs;j++) {
6225984c4197SStefano Zampini             start_vals = &qr_basis[j*size_of_constraint];
62269162d606SStefano Zampini             start_cols = &constraints_idxs[constraints_idxs_ptr[total_counts]+j];
6227906d46d4SStefano Zampini             ierr = MatSetValues(localChangeOfBasisMatrix,size_of_constraint,start_rows,1,start_cols,start_vals,INSERT_VALUES);CHKERRQ(ierr);
6228984c4197SStefano Zampini           }
6229984c4197SStefano Zampini           /* insert cols for dual dofs */
6230984c4197SStefano Zampini           for (j=0,k=0;j<dual_dofs;k++) {
62319162d606SStefano Zampini             if (!PetscBTLookup(is_primal,constraints_idxs_B[constraints_idxs_ptr[total_counts]+k])) {
6232984c4197SStefano Zampini               start_vals = &qr_basis[(primal_dofs+j)*size_of_constraint];
62339162d606SStefano Zampini               start_cols = &constraints_idxs[constraints_idxs_ptr[total_counts]+k];
6234906d46d4SStefano Zampini               ierr = MatSetValues(localChangeOfBasisMatrix,size_of_constraint,start_rows,1,start_cols,start_vals,INSERT_VALUES);CHKERRQ(ierr);
6235984c4197SStefano Zampini               j++;
6236674ae819SStefano Zampini             }
6237674ae819SStefano Zampini           }
6238984c4197SStefano Zampini 
6239984c4197SStefano Zampini           /* check change of basis */
6240984c4197SStefano Zampini           if (pcbddc->dbg_flag) {
6241984c4197SStefano Zampini             PetscInt   ii,jj;
6242984c4197SStefano Zampini             PetscBool valid_qr=PETSC_TRUE;
6243c4303822SStefano Zampini             ierr = PetscBLASIntCast(primal_dofs,&Blas_M);CHKERRQ(ierr);
6244c4303822SStefano Zampini             ierr = PetscBLASIntCast(size_of_constraint,&Blas_N);CHKERRQ(ierr);
6245c4303822SStefano Zampini             ierr = PetscBLASIntCast(size_of_constraint,&Blas_K);CHKERRQ(ierr);
6246c4303822SStefano Zampini             ierr = PetscBLASIntCast(size_of_constraint,&Blas_LDA);CHKERRQ(ierr);
6247c4303822SStefano Zampini             ierr = PetscBLASIntCast(size_of_constraint,&Blas_LDB);CHKERRQ(ierr);
6248c4303822SStefano Zampini             ierr = PetscBLASIntCast(primal_dofs,&Blas_LDC);CHKERRQ(ierr);
6249984c4197SStefano Zampini             ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr);
6250cf5a6209SStefano Zampini             PetscStackCallBLAS("BLASgemm",BLASgemm_("T","N",&Blas_M,&Blas_N,&Blas_K,&one,dbg_work,&Blas_LDA,qr_basis,&Blas_LDB,&zero,&dbg_work[size_of_constraint*primal_dofs],&Blas_LDC));
6251984c4197SStefano Zampini             ierr = PetscFPTrapPop();CHKERRQ(ierr);
6252984c4197SStefano Zampini             for (jj=0;jj<size_of_constraint;jj++) {
6253984c4197SStefano Zampini               for (ii=0;ii<primal_dofs;ii++) {
6254cf5a6209SStefano Zampini                 if (ii != jj && PetscAbsScalar(dbg_work[size_of_constraint*primal_dofs+jj*primal_dofs+ii]) > 1.e-12) valid_qr = PETSC_FALSE;
6255cf5a6209SStefano Zampini                 if (ii == jj && PetscAbsScalar(dbg_work[size_of_constraint*primal_dofs+jj*primal_dofs+ii]-1.0) > 1.e-12) valid_qr = PETSC_FALSE;
6256674ae819SStefano Zampini               }
6257674ae819SStefano Zampini             }
6258984c4197SStefano Zampini             if (!valid_qr) {
625922d5777bSStefano Zampini               ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"\t-> wrong change of basis!\n");CHKERRQ(ierr);
6260984c4197SStefano Zampini               for (jj=0;jj<size_of_constraint;jj++) {
6261984c4197SStefano Zampini                 for (ii=0;ii<primal_dofs;ii++) {
6262cf5a6209SStefano Zampini                   if (ii != jj && PetscAbsScalar(dbg_work[size_of_constraint*primal_dofs+jj*primal_dofs+ii]) > 1.e-12) {
6263cf5a6209SStefano Zampini                     PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"\tQr basis function %d is not orthogonal to constraint %d (%1.14e)!\n",jj,ii,PetscAbsScalar(dbg_work[size_of_constraint*primal_dofs+jj*primal_dofs+ii]));
6264674ae819SStefano Zampini                   }
6265cf5a6209SStefano Zampini                   if (ii == jj && PetscAbsScalar(dbg_work[size_of_constraint*primal_dofs+jj*primal_dofs+ii]-1.0) > 1.e-12) {
6266cf5a6209SStefano Zampini                     PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"\tQr basis function %d is not unitary w.r.t constraint %d (%1.14e)!\n",jj,ii,PetscAbsScalar(dbg_work[size_of_constraint*primal_dofs+jj*primal_dofs+ii]));
6267984c4197SStefano Zampini                   }
6268984c4197SStefano Zampini                 }
6269984c4197SStefano Zampini               }
6270674ae819SStefano Zampini             } else {
627122d5777bSStefano Zampini               ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"\t-> right change of basis!\n");CHKERRQ(ierr);
6272674ae819SStefano Zampini             }
6273674ae819SStefano Zampini           }
6274a717540cSStefano Zampini         } else { /* simple transformation block */
6275a717540cSStefano Zampini           PetscInt    row,col;
6276a6b551f4SStefano Zampini           PetscScalar val,norm;
6277a6b551f4SStefano Zampini 
6278a6b551f4SStefano Zampini           ierr = PetscBLASIntCast(size_of_constraint,&Blas_N);CHKERRQ(ierr);
62799162d606SStefano Zampini           PetscStackCallBLAS("BLASdot",norm = BLASdot_(&Blas_N,constraints_data+constraints_data_ptr[total_counts],&Blas_one,constraints_data+constraints_data_ptr[total_counts],&Blas_one));
6280a717540cSStefano Zampini           for (j=0;j<size_of_constraint;j++) {
62819162d606SStefano Zampini             PetscInt row_B = constraints_idxs_B[constraints_idxs_ptr[total_counts]+j];
62829162d606SStefano Zampini             row = constraints_idxs[constraints_idxs_ptr[total_counts]+j];
6283bbb9e6c6SStefano Zampini             if (!PetscBTLookup(is_primal,row_B)) {
62849162d606SStefano Zampini               col = constraints_idxs[constraints_idxs_ptr[total_counts]];
6285906d46d4SStefano Zampini               ierr = MatSetValue(localChangeOfBasisMatrix,row,row,1.0,INSERT_VALUES);CHKERRQ(ierr);
62869162d606SStefano Zampini               ierr = MatSetValue(localChangeOfBasisMatrix,row,col,constraints_data[constraints_data_ptr[total_counts]+j]/norm,INSERT_VALUES);CHKERRQ(ierr);
6287a717540cSStefano Zampini             } else {
6288a717540cSStefano Zampini               for (k=0;k<size_of_constraint;k++) {
62899162d606SStefano Zampini                 col = constraints_idxs[constraints_idxs_ptr[total_counts]+k];
6290a717540cSStefano Zampini                 if (row != col) {
62919162d606SStefano Zampini                   val = -constraints_data[constraints_data_ptr[total_counts]+k]/constraints_data[constraints_data_ptr[total_counts]];
6292a717540cSStefano Zampini                 } else {
62939162d606SStefano Zampini                   val = constraints_data[constraints_data_ptr[total_counts]]/norm;
6294a717540cSStefano Zampini                 }
6295906d46d4SStefano Zampini                 ierr = MatSetValue(localChangeOfBasisMatrix,row,col,val,INSERT_VALUES);CHKERRQ(ierr);
6296a717540cSStefano Zampini               }
6297a717540cSStefano Zampini             }
6298a717540cSStefano Zampini           }
629998a51de6SStefano Zampini           if (pcbddc->dbg_flag) {
630022d5777bSStefano Zampini             ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"\t-> using standard change of basis\n");CHKERRQ(ierr);
6301a717540cSStefano Zampini           }
6302674ae819SStefano Zampini         }
6303984c4197SStefano Zampini       } else {
6304984c4197SStefano Zampini         if (pcbddc->dbg_flag) {
63059162d606SStefano Zampini           ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"Constraint %d does not need a change of basis (size %d)\n",total_counts,size_of_constraint);CHKERRQ(ierr);
6306674ae819SStefano Zampini         }
6307674ae819SStefano Zampini       }
6308674ae819SStefano Zampini     }
6309a717540cSStefano Zampini 
6310a717540cSStefano Zampini     /* free workspace */
6311a717540cSStefano Zampini     if (qr_needed) {
6312984c4197SStefano Zampini       if (pcbddc->dbg_flag) {
6313cf5a6209SStefano Zampini         ierr = PetscFree(dbg_work);CHKERRQ(ierr);
6314984c4197SStefano Zampini       }
6315984c4197SStefano Zampini       ierr = PetscFree(trs_rhs);CHKERRQ(ierr);
6316984c4197SStefano Zampini       ierr = PetscFree(qr_tau);CHKERRQ(ierr);
6317984c4197SStefano Zampini       ierr = PetscFree(qr_work);CHKERRQ(ierr);
6318984c4197SStefano Zampini       ierr = PetscFree(gqr_work);CHKERRQ(ierr);
6319984c4197SStefano Zampini       ierr = PetscFree(qr_basis);CHKERRQ(ierr);
6320674ae819SStefano Zampini     }
6321a717540cSStefano Zampini     ierr = PetscBTDestroy(&is_primal);CHKERRQ(ierr);
6322906d46d4SStefano Zampini     ierr = MatAssemblyBegin(localChangeOfBasisMatrix,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
6323906d46d4SStefano Zampini     ierr = MatAssemblyEnd(localChangeOfBasisMatrix,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
6324906d46d4SStefano Zampini 
6325906d46d4SStefano Zampini     /* assembling of global change of variable */
632688c03ad3SStefano Zampini     if (!pcbddc->fake_change) {
6327bbb9e6c6SStefano Zampini       Mat      tmat;
632816f15bc4SStefano Zampini       PetscInt bs;
632916f15bc4SStefano Zampini 
6330906d46d4SStefano Zampini       ierr = VecGetSize(pcis->vec1_global,&global_size);CHKERRQ(ierr);
6331906d46d4SStefano Zampini       ierr = VecGetLocalSize(pcis->vec1_global,&local_size);CHKERRQ(ierr);
6332bbb9e6c6SStefano Zampini       ierr = MatDuplicate(pc->pmat,MAT_DO_NOT_COPY_VALUES,&tmat);CHKERRQ(ierr);
6333bbb9e6c6SStefano Zampini       ierr = MatISSetLocalMat(tmat,localChangeOfBasisMatrix);CHKERRQ(ierr);
6334bbb9e6c6SStefano Zampini       ierr = MatCreate(PetscObjectComm((PetscObject)pc),&pcbddc->ChangeOfBasisMatrix);CHKERRQ(ierr);
6335bbb9e6c6SStefano Zampini       ierr = MatSetType(pcbddc->ChangeOfBasisMatrix,MATAIJ);CHKERRQ(ierr);
633616f15bc4SStefano Zampini       ierr = MatGetBlockSize(pc->pmat,&bs);CHKERRQ(ierr);
633716f15bc4SStefano Zampini       ierr = MatSetBlockSize(pcbddc->ChangeOfBasisMatrix,bs);CHKERRQ(ierr);
6338906d46d4SStefano Zampini       ierr = MatSetSizes(pcbddc->ChangeOfBasisMatrix,local_size,local_size,global_size,global_size);CHKERRQ(ierr);
6339bbb9e6c6SStefano Zampini       ierr = MatISSetMPIXAIJPreallocation_Private(tmat,pcbddc->ChangeOfBasisMatrix,PETSC_TRUE);CHKERRQ(ierr);
6340bbb9e6c6SStefano Zampini       ierr = MatISGetMPIXAIJ(tmat,MAT_REUSE_MATRIX,&pcbddc->ChangeOfBasisMatrix);CHKERRQ(ierr);
6341bbb9e6c6SStefano Zampini       ierr = MatDestroy(&tmat);CHKERRQ(ierr);
6342bbb9e6c6SStefano Zampini       ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
6343bbb9e6c6SStefano Zampini       ierr = VecSet(pcis->vec1_N,1.0);CHKERRQ(ierr);
6344e176bc59SStefano Zampini       ierr = VecScatterBegin(matis->rctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
6345e176bc59SStefano Zampini       ierr = VecScatterEnd(matis->rctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
6346bbb9e6c6SStefano Zampini       ierr = VecReciprocal(pcis->vec1_global);CHKERRQ(ierr);
6347bbb9e6c6SStefano Zampini       ierr = MatDiagonalScale(pcbddc->ChangeOfBasisMatrix,pcis->vec1_global,NULL);CHKERRQ(ierr);
634888c03ad3SStefano Zampini 
6349906d46d4SStefano Zampini       /* check */
6350906d46d4SStefano Zampini       if (pcbddc->dbg_flag) {
6351906d46d4SStefano Zampini         PetscReal error;
6352906d46d4SStefano Zampini         Vec       x,x_change;
6353906d46d4SStefano Zampini 
6354906d46d4SStefano Zampini         ierr = VecDuplicate(pcis->vec1_global,&x);CHKERRQ(ierr);
6355906d46d4SStefano Zampini         ierr = VecDuplicate(pcis->vec1_global,&x_change);CHKERRQ(ierr);
6356906d46d4SStefano Zampini         ierr = VecSetRandom(x,NULL);CHKERRQ(ierr);
6357906d46d4SStefano Zampini         ierr = VecCopy(x,pcis->vec1_global);CHKERRQ(ierr);
6358e176bc59SStefano Zampini         ierr = VecScatterBegin(matis->rctx,x,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
6359e176bc59SStefano Zampini         ierr = VecScatterEnd(matis->rctx,x,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
6360bbb9e6c6SStefano Zampini         ierr = MatMult(localChangeOfBasisMatrix,pcis->vec1_N,pcis->vec2_N);CHKERRQ(ierr);
6361e176bc59SStefano Zampini         ierr = VecScatterBegin(matis->rctx,pcis->vec2_N,x,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
6362e176bc59SStefano Zampini         ierr = VecScatterEnd(matis->rctx,pcis->vec2_N,x,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
6363906d46d4SStefano Zampini         ierr = MatMult(pcbddc->ChangeOfBasisMatrix,pcis->vec1_global,x_change);CHKERRQ(ierr);
6364906d46d4SStefano Zampini         ierr = VecAXPY(x,-1.0,x_change);CHKERRQ(ierr);
6365906d46d4SStefano Zampini         ierr = VecNorm(x,NORM_INFINITY,&error);CHKERRQ(ierr);
6366637e8532SStefano Zampini         if (error > PETSC_SMALL) {
6367637e8532SStefano Zampini           SETERRQ1(PetscObjectComm((PetscObject)pc),PETSC_ERR_PLIB,"Error global vs local change on N: %1.6e\n",error);
6368637e8532SStefano Zampini         }
6369906d46d4SStefano Zampini         ierr = VecDestroy(&x);CHKERRQ(ierr);
6370906d46d4SStefano Zampini         ierr = VecDestroy(&x_change);CHKERRQ(ierr);
6371906d46d4SStefano Zampini       }
6372b96c3477SStefano Zampini       /* adapt sub_schurs computed (if any) */
6373b96c3477SStefano Zampini       if (pcbddc->use_deluxe_scaling) {
6374b96c3477SStefano Zampini         PCBDDCSubSchurs sub_schurs=pcbddc->sub_schurs;
6375bf3a8328SStefano Zampini 
637613903a91SSatish Balay         if (pcbddc->use_change_of_basis && pcbddc->adaptive_userdefined) SETERRQ(PetscObjectComm((PetscObject)pc),PETSC_ERR_SUP,"Cannot mix automatic change of basis, adaptive selection and user-defined constraints");
6377b334f244SStefano Zampini         if (sub_schurs && sub_schurs->S_Ej_all) {
6378ac632422SStefano Zampini           Mat                    S_new,tmat;
6379bf3a8328SStefano Zampini           IS                     is_all_N,is_V_Sall = NULL;
6380bbb9e6c6SStefano Zampini 
6381bbb9e6c6SStefano Zampini           ierr = ISLocalToGlobalMappingApplyIS(pcis->BtoNmap,sub_schurs->is_Ej_all,&is_all_N);CHKERRQ(ierr);
63827dae84e0SHong Zhang           ierr = MatCreateSubMatrix(localChangeOfBasisMatrix,is_all_N,is_all_N,MAT_INITIAL_MATRIX,&tmat);CHKERRQ(ierr);
6383bf3a8328SStefano Zampini           if (pcbddc->deluxe_zerorows) {
6384bf3a8328SStefano Zampini             ISLocalToGlobalMapping NtoSall;
6385bf3a8328SStefano Zampini             IS                     is_V;
6386b087196eSStefano Zampini             ierr = ISCreateGeneral(PETSC_COMM_SELF,pcbddc->n_vertices,pcbddc->local_primal_ref_node,PETSC_COPY_VALUES,&is_V);CHKERRQ(ierr);
6387b087196eSStefano Zampini             ierr = ISLocalToGlobalMappingCreateIS(is_all_N,&NtoSall);CHKERRQ(ierr);
6388b087196eSStefano Zampini             ierr = ISGlobalToLocalMappingApplyIS(NtoSall,IS_GTOLM_DROP,is_V,&is_V_Sall);CHKERRQ(ierr);
6389b087196eSStefano Zampini             ierr = ISLocalToGlobalMappingDestroy(&NtoSall);CHKERRQ(ierr);
6390b087196eSStefano Zampini             ierr = ISDestroy(&is_V);CHKERRQ(ierr);
6391bf3a8328SStefano Zampini           }
6392bf3a8328SStefano Zampini           ierr = ISDestroy(&is_all_N);CHKERRQ(ierr);
6393ac632422SStefano Zampini           ierr = MatPtAP(sub_schurs->S_Ej_all,tmat,MAT_INITIAL_MATRIX,1.0,&S_new);CHKERRQ(ierr);
6394b96c3477SStefano Zampini           ierr = MatDestroy(&sub_schurs->S_Ej_all);CHKERRQ(ierr);
6395ac632422SStefano Zampini           ierr = PetscObjectReference((PetscObject)S_new);CHKERRQ(ierr);
6396bf3a8328SStefano Zampini           if (pcbddc->deluxe_zerorows) {
6397bf3a8328SStefano Zampini             const PetscScalar *array;
6398bf3a8328SStefano Zampini             const PetscInt    *idxs_V,*idxs_all;
6399bf3a8328SStefano Zampini             PetscInt          i,n_V;
6400bf3a8328SStefano Zampini 
6401b087196eSStefano Zampini             ierr = MatZeroRowsColumnsIS(S_new,is_V_Sall,1.,NULL,NULL);CHKERRQ(ierr);
6402b087196eSStefano Zampini             ierr = ISGetLocalSize(is_V_Sall,&n_V);CHKERRQ(ierr);
6403b087196eSStefano Zampini             ierr = ISGetIndices(is_V_Sall,&idxs_V);CHKERRQ(ierr);
6404b087196eSStefano Zampini             ierr = ISGetIndices(sub_schurs->is_Ej_all,&idxs_all);CHKERRQ(ierr);
6405b087196eSStefano Zampini             ierr = VecGetArrayRead(pcis->D,&array);CHKERRQ(ierr);
6406b087196eSStefano Zampini             for (i=0;i<n_V;i++) {
6407b087196eSStefano Zampini               PetscScalar val;
6408b087196eSStefano Zampini               PetscInt    idx;
6409b087196eSStefano Zampini 
6410b087196eSStefano Zampini               idx = idxs_V[i];
6411b087196eSStefano Zampini               val = array[idxs_all[idxs_V[i]]];
6412b087196eSStefano Zampini               ierr = MatSetValue(S_new,idx,idx,val,INSERT_VALUES);CHKERRQ(ierr);
6413b087196eSStefano Zampini             }
6414b087196eSStefano Zampini             ierr = MatAssemblyBegin(S_new,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
6415b087196eSStefano Zampini             ierr = MatAssemblyEnd(S_new,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
6416bf3a8328SStefano Zampini             ierr = VecRestoreArrayRead(pcis->D,&array);CHKERRQ(ierr);
6417bf3a8328SStefano Zampini             ierr = ISRestoreIndices(sub_schurs->is_Ej_all,&idxs_all);CHKERRQ(ierr);
6418bf3a8328SStefano Zampini             ierr = ISRestoreIndices(is_V_Sall,&idxs_V);CHKERRQ(ierr);
6419bf3a8328SStefano Zampini           }
6420ac632422SStefano Zampini           sub_schurs->S_Ej_all = S_new;
6421ac632422SStefano Zampini           ierr = MatDestroy(&S_new);CHKERRQ(ierr);
6422ac632422SStefano Zampini           if (sub_schurs->sum_S_Ej_all) {
6423ac632422SStefano Zampini             ierr = MatPtAP(sub_schurs->sum_S_Ej_all,tmat,MAT_INITIAL_MATRIX,1.0,&S_new);CHKERRQ(ierr);
6424b96c3477SStefano Zampini             ierr = MatDestroy(&sub_schurs->sum_S_Ej_all);CHKERRQ(ierr);
6425ac632422SStefano Zampini             ierr = PetscObjectReference((PetscObject)S_new);CHKERRQ(ierr);
6426bf3a8328SStefano Zampini             if (pcbddc->deluxe_zerorows) {
6427b087196eSStefano Zampini               ierr = MatZeroRowsColumnsIS(S_new,is_V_Sall,1.,NULL,NULL);CHKERRQ(ierr);
6428bf3a8328SStefano Zampini             }
6429ac632422SStefano Zampini             sub_schurs->sum_S_Ej_all = S_new;
6430ac632422SStefano Zampini             ierr = MatDestroy(&S_new);CHKERRQ(ierr);
6431ac632422SStefano Zampini           }
6432b087196eSStefano Zampini           ierr = ISDestroy(&is_V_Sall);CHKERRQ(ierr);
643388c03ad3SStefano Zampini           ierr = MatDestroy(&tmat);CHKERRQ(ierr);
6434b96c3477SStefano Zampini         }
6435c9db6a07SStefano Zampini         /* destroy any change of basis context in sub_schurs */
6436b334f244SStefano Zampini         if (sub_schurs && sub_schurs->change) {
6437c9db6a07SStefano Zampini           PetscInt i;
6438c9db6a07SStefano Zampini 
6439c9db6a07SStefano Zampini           for (i=0;i<sub_schurs->n_subs;i++) {
6440c9db6a07SStefano Zampini             ierr = KSPDestroy(&sub_schurs->change[i]);CHKERRQ(ierr);
6441c9db6a07SStefano Zampini           }
6442c9db6a07SStefano Zampini           ierr = PetscFree(sub_schurs->change);CHKERRQ(ierr);
6443c9db6a07SStefano Zampini         }
6444b96c3477SStefano Zampini       }
644516909a7fSStefano Zampini       if (pcbddc->switch_static) { /* need to save the local change */
644616909a7fSStefano Zampini         pcbddc->switch_static_change = localChangeOfBasisMatrix;
644716909a7fSStefano Zampini       } else {
6448906d46d4SStefano Zampini         ierr = MatDestroy(&localChangeOfBasisMatrix);CHKERRQ(ierr);
644916909a7fSStefano Zampini       }
64501dd7afcfSStefano Zampini       /* determine if any process has changed the pressures locally */
645127b6a85dSStefano Zampini       pcbddc->change_interior = pcbddc->benign_have_null;
645272b8c272SStefano Zampini     } else { /* fake change (get back change of basis into ConstraintMatrix and info on qr) */
645372b8c272SStefano Zampini       ierr = MatDestroy(&pcbddc->ConstraintMatrix);CHKERRQ(ierr);
645472b8c272SStefano Zampini       pcbddc->ConstraintMatrix = localChangeOfBasisMatrix;
645572b8c272SStefano Zampini       pcbddc->use_qr_single = qr_needed;
645672b8c272SStefano Zampini     }
64571dd7afcfSStefano Zampini   } else if (pcbddc->user_ChangeOfBasisMatrix || pcbddc->benign_saddle_point) {
645827b6a85dSStefano Zampini     if (!pcbddc->benign_have_null && pcbddc->user_ChangeOfBasisMatrix) {
6459b9b85e73SStefano Zampini       ierr = PetscObjectReference((PetscObject)pcbddc->user_ChangeOfBasisMatrix);CHKERRQ(ierr);
6460b9b85e73SStefano Zampini       pcbddc->ChangeOfBasisMatrix = pcbddc->user_ChangeOfBasisMatrix;
6461906d46d4SStefano Zampini     } else {
64621dd7afcfSStefano Zampini       Mat benign_global = NULL;
646327b6a85dSStefano Zampini       if (pcbddc->benign_have_null) {
64641dd7afcfSStefano Zampini         Mat tmat;
64651dd7afcfSStefano Zampini 
64661dd7afcfSStefano Zampini         pcbddc->change_interior = PETSC_TRUE;
64671dd7afcfSStefano Zampini         ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
64681dd7afcfSStefano Zampini         ierr = VecSet(pcis->vec1_N,1.0);CHKERRQ(ierr);
64691dd7afcfSStefano Zampini         ierr = VecScatterBegin(matis->rctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
64701dd7afcfSStefano Zampini         ierr = VecScatterEnd(matis->rctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
64711dd7afcfSStefano Zampini         ierr = VecReciprocal(pcis->vec1_global);CHKERRQ(ierr);
64721dd7afcfSStefano Zampini         ierr = VecScatterBegin(matis->rctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
64731dd7afcfSStefano Zampini         ierr = VecScatterEnd(matis->rctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
64741dd7afcfSStefano Zampini         ierr = MatDuplicate(pc->pmat,MAT_DO_NOT_COPY_VALUES,&tmat);CHKERRQ(ierr);
64751dd7afcfSStefano Zampini         if (pcbddc->benign_change) {
64761dd7afcfSStefano Zampini           Mat M;
64771dd7afcfSStefano Zampini 
64781dd7afcfSStefano Zampini           ierr = MatDuplicate(pcbddc->benign_change,MAT_COPY_VALUES,&M);CHKERRQ(ierr);
64791dd7afcfSStefano Zampini           ierr = MatDiagonalScale(M,pcis->vec1_N,NULL);CHKERRQ(ierr);
64801dd7afcfSStefano Zampini           ierr = MatISSetLocalMat(tmat,M);CHKERRQ(ierr);
64811dd7afcfSStefano Zampini           ierr = MatDestroy(&M);CHKERRQ(ierr);
6482906d46d4SStefano Zampini         } else {
64831dd7afcfSStefano Zampini           Mat         eye;
64841dd7afcfSStefano Zampini           PetscScalar *array;
64851dd7afcfSStefano Zampini 
64861dd7afcfSStefano Zampini           ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
64871dd7afcfSStefano Zampini           ierr = MatCreateSeqAIJ(PETSC_COMM_SELF,pcis->n,pcis->n,1,NULL,&eye);CHKERRQ(ierr);
64881dd7afcfSStefano Zampini           for (i=0;i<pcis->n;i++) {
64891dd7afcfSStefano Zampini             ierr = MatSetValue(eye,i,i,array[i],INSERT_VALUES);CHKERRQ(ierr);
6490906d46d4SStefano Zampini           }
64911dd7afcfSStefano Zampini           ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
64921dd7afcfSStefano Zampini           ierr = MatAssemblyBegin(eye,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
64931dd7afcfSStefano Zampini           ierr = MatAssemblyEnd(eye,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
64941dd7afcfSStefano Zampini           ierr = MatISSetLocalMat(tmat,eye);CHKERRQ(ierr);
64951dd7afcfSStefano Zampini           ierr = MatDestroy(&eye);CHKERRQ(ierr);
64961dd7afcfSStefano Zampini         }
64971dd7afcfSStefano Zampini         ierr = MatISGetMPIXAIJ(tmat,MAT_INITIAL_MATRIX,&benign_global);CHKERRQ(ierr);
64981dd7afcfSStefano Zampini         ierr = MatDestroy(&tmat);CHKERRQ(ierr);
64991dd7afcfSStefano Zampini       }
65001dd7afcfSStefano Zampini       if (pcbddc->user_ChangeOfBasisMatrix) {
65011dd7afcfSStefano Zampini         ierr = MatMatMult(pcbddc->user_ChangeOfBasisMatrix,benign_global,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&pcbddc->ChangeOfBasisMatrix);CHKERRQ(ierr);
65021dd7afcfSStefano Zampini         ierr = MatDestroy(&benign_global);CHKERRQ(ierr);
650327b6a85dSStefano Zampini       } else if (pcbddc->benign_have_null) {
65041dd7afcfSStefano Zampini         pcbddc->ChangeOfBasisMatrix = benign_global;
65051dd7afcfSStefano Zampini       }
65061dd7afcfSStefano Zampini     }
650716909a7fSStefano Zampini     if (pcbddc->switch_static && pcbddc->ChangeOfBasisMatrix) { /* need to save the local change */
650816909a7fSStefano Zampini       IS             is_global;
650916909a7fSStefano Zampini       const PetscInt *gidxs;
651016909a7fSStefano Zampini 
651116909a7fSStefano Zampini       ierr = ISLocalToGlobalMappingGetIndices(pc->pmat->rmap->mapping,&gidxs);CHKERRQ(ierr);
651216909a7fSStefano Zampini       ierr = ISCreateGeneral(PetscObjectComm((PetscObject)pc),pcis->n,gidxs,PETSC_COPY_VALUES,&is_global);CHKERRQ(ierr);
651316909a7fSStefano Zampini       ierr = ISLocalToGlobalMappingRestoreIndices(pc->pmat->rmap->mapping,&gidxs);CHKERRQ(ierr);
65147dae84e0SHong Zhang       ierr = MatCreateSubMatrixUnsorted(pcbddc->ChangeOfBasisMatrix,is_global,is_global,&pcbddc->switch_static_change);CHKERRQ(ierr);
651516909a7fSStefano Zampini       ierr = ISDestroy(&is_global);CHKERRQ(ierr);
651616909a7fSStefano Zampini     }
65171dd7afcfSStefano Zampini   }
65181dd7afcfSStefano Zampini   if (!pcbddc->fake_change && pcbddc->ChangeOfBasisMatrix && !pcbddc->work_change) {
65191dd7afcfSStefano Zampini     ierr = VecDuplicate(pcis->vec1_global,&pcbddc->work_change);CHKERRQ(ierr);
6520b9b85e73SStefano Zampini   }
6521a717540cSStefano Zampini 
652272b8c272SStefano Zampini   if (!pcbddc->fake_change) {
65234f1b2e48SStefano Zampini     /* add pressure dofs to set of primal nodes for numbering purposes */
65244f1b2e48SStefano Zampini     for (i=0;i<pcbddc->benign_n;i++) {
65254f1b2e48SStefano Zampini       pcbddc->local_primal_ref_node[pcbddc->local_primal_size_cc] = pcbddc->benign_p0_lidx[i];
65264f1b2e48SStefano Zampini       pcbddc->primal_indices_local_idxs[pcbddc->local_primal_size] = pcbddc->benign_p0_lidx[i];
6527019a44ceSStefano Zampini       pcbddc->local_primal_ref_mult[pcbddc->local_primal_size_cc] = 1;
6528019a44ceSStefano Zampini       pcbddc->local_primal_size_cc++;
6529019a44ceSStefano Zampini       pcbddc->local_primal_size++;
6530019a44ceSStefano Zampini     }
6531019a44ceSStefano Zampini 
6532019a44ceSStefano Zampini     /* check if a new primal space has been introduced (also take into account benign trick) */
6533727cdba6SStefano Zampini     pcbddc->new_primal_space_local = PETSC_TRUE;
6534727cdba6SStefano Zampini     if (olocal_primal_size == pcbddc->local_primal_size) {
65359f47a83aSStefano Zampini       ierr = PetscMemcmp(pcbddc->local_primal_ref_node,olocal_primal_ref_node,olocal_primal_size_cc*sizeof(PetscInt),&pcbddc->new_primal_space_local);CHKERRQ(ierr);
6536c1c8e736SStefano Zampini       pcbddc->new_primal_space_local = (PetscBool)(!pcbddc->new_primal_space_local);
65370e6343abSStefano Zampini       if (!pcbddc->new_primal_space_local) {
65389f47a83aSStefano Zampini         ierr = PetscMemcmp(pcbddc->local_primal_ref_mult,olocal_primal_ref_mult,olocal_primal_size_cc*sizeof(PetscInt),&pcbddc->new_primal_space_local);CHKERRQ(ierr);
6539727cdba6SStefano Zampini         pcbddc->new_primal_space_local = (PetscBool)(!pcbddc->new_primal_space_local);
6540727cdba6SStefano Zampini       }
65410e6343abSStefano Zampini     }
6542727cdba6SStefano Zampini     /* new_primal_space will be used for numbering of coarse dofs, so it should be the same across all subdomains */
6543b2566f29SBarry Smith     ierr = MPIU_Allreduce(&pcbddc->new_primal_space_local,&pcbddc->new_primal_space,1,MPIU_BOOL,MPI_LOR,PetscObjectComm((PetscObject)pc));CHKERRQ(ierr);
654472b8c272SStefano Zampini   }
654572b8c272SStefano Zampini   ierr = PetscFree2(olocal_primal_ref_node,olocal_primal_ref_mult);CHKERRQ(ierr);
6546727cdba6SStefano Zampini 
6547a717540cSStefano Zampini   /* flush dbg viewer */
6548b8ffe317SStefano Zampini   if (pcbddc->dbg_flag) {
6549b8ffe317SStefano Zampini     ierr = PetscViewerFlush(pcbddc->dbg_viewer);CHKERRQ(ierr);
6550b8ffe317SStefano Zampini   }
6551a717540cSStefano Zampini 
6552e310c8b4SStefano Zampini   /* free workspace */
6553a717540cSStefano Zampini   ierr = PetscBTDestroy(&qr_needed_idx);CHKERRQ(ierr);
65544641a718SStefano Zampini   ierr = PetscBTDestroy(&change_basis);CHKERRQ(ierr);
655508122e43SStefano Zampini   if (!pcbddc->adaptive_selection) {
65569162d606SStefano Zampini     ierr = PetscFree3(constraints_idxs_ptr,constraints_data_ptr,constraints_n);CHKERRQ(ierr);
65579162d606SStefano Zampini     ierr = PetscFree3(constraints_data,constraints_idxs,constraints_idxs_B);CHKERRQ(ierr);
655808122e43SStefano Zampini   } else {
65599162d606SStefano Zampini     ierr = PetscFree5(pcbddc->adaptive_constraints_n,
65609162d606SStefano Zampini                       pcbddc->adaptive_constraints_idxs_ptr,
65619162d606SStefano Zampini                       pcbddc->adaptive_constraints_data_ptr,
656208122e43SStefano Zampini                       pcbddc->adaptive_constraints_idxs,
656308122e43SStefano Zampini                       pcbddc->adaptive_constraints_data);CHKERRQ(ierr);
65649162d606SStefano Zampini     ierr = PetscFree(constraints_n);CHKERRQ(ierr);
65659162d606SStefano Zampini     ierr = PetscFree(constraints_idxs_B);CHKERRQ(ierr);
656608122e43SStefano Zampini   }
6567674ae819SStefano Zampini   PetscFunctionReturn(0);
6568674ae819SStefano Zampini }
6569674ae819SStefano Zampini 
6570674ae819SStefano Zampini PetscErrorCode PCBDDCAnalyzeInterface(PC pc)
6571674ae819SStefano Zampini {
657271582508SStefano Zampini   ISLocalToGlobalMapping map;
6573674ae819SStefano Zampini   PC_BDDC                *pcbddc = (PC_BDDC*)pc->data;
6574674ae819SStefano Zampini   Mat_IS                 *matis  = (Mat_IS*)pc->pmat->data;
657566da6bd7Sstefano_zampini   PetscInt               i,N;
657666da6bd7Sstefano_zampini   PetscBool              rcsr = PETSC_FALSE;
657766da6bd7Sstefano_zampini   PetscErrorCode         ierr;
6578674ae819SStefano Zampini 
6579674ae819SStefano Zampini   PetscFunctionBegin;
65808af8fcf9SStefano Zampini   if (pcbddc->recompute_topography) {
6581b03ebc13SStefano Zampini     pcbddc->graphanalyzed = PETSC_FALSE;
65828e61c736SStefano Zampini     /* Reset previously computed graph */
65838e61c736SStefano Zampini     ierr = PCBDDCGraphReset(pcbddc->mat_graph);CHKERRQ(ierr);
6584674ae819SStefano Zampini     /* Init local Graph struct */
65857fb0e2dbSStefano Zampini     ierr = MatGetSize(pc->pmat,&N,NULL);CHKERRQ(ierr);
658671582508SStefano Zampini     ierr = MatGetLocalToGlobalMapping(pc->pmat,&map,NULL);CHKERRQ(ierr);
6587be12c134Sstefano_zampini     ierr = PCBDDCGraphInit(pcbddc->mat_graph,map,N,pcbddc->graphmaxcount);CHKERRQ(ierr);
6588674ae819SStefano Zampini 
65897a0e7b2cSstefano_zampini     if (pcbddc->user_primal_vertices_local && !pcbddc->user_primal_vertices) {
65907a0e7b2cSstefano_zampini       ierr = PCBDDCConsistencyCheckIS(pc,MPI_LOR,&pcbddc->user_primal_vertices_local);CHKERRQ(ierr);
65917a0e7b2cSstefano_zampini     }
6592575ad6abSStefano Zampini     /* Check validity of the csr graph passed in by the user */
65939a962809SStefano Zampini     if (pcbddc->mat_graph->nvtxs_csr && pcbddc->mat_graph->nvtxs_csr != pcbddc->mat_graph->nvtxs) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONG,"Invalid size of local CSR graph! Found %d, expected %d\n",pcbddc->mat_graph->nvtxs_csr,pcbddc->mat_graph->nvtxs);
65949577ea80SStefano Zampini 
6595674ae819SStefano Zampini     /* Set default CSR adjacency of local dofs if not provided by the user with PCBDDCSetLocalAdjacencyGraph */
659666da6bd7Sstefano_zampini     if (!pcbddc->mat_graph->xadj && pcbddc->use_local_adj) {
65974d379d7bSStefano Zampini       PetscInt  *xadj,*adjncy;
65984d379d7bSStefano Zampini       PetscInt  nvtxs;
6599e496cd5dSStefano Zampini       PetscBool flg_row=PETSC_FALSE;
6600674ae819SStefano Zampini 
66012fffb893SStefano Zampini       ierr = MatGetRowIJ(matis->A,0,PETSC_TRUE,PETSC_FALSE,&nvtxs,(const PetscInt**)&xadj,(const PetscInt**)&adjncy,&flg_row);CHKERRQ(ierr);
66022fffb893SStefano Zampini       if (flg_row) {
66034d379d7bSStefano Zampini         ierr = PCBDDCSetLocalAdjacencyGraph(pc,nvtxs,xadj,adjncy,PETSC_COPY_VALUES);CHKERRQ(ierr);
6604b96c3477SStefano Zampini         pcbddc->computed_rowadj = PETSC_TRUE;
66052fffb893SStefano Zampini       }
66062fffb893SStefano Zampini       ierr = MatRestoreRowIJ(matis->A,0,PETSC_TRUE,PETSC_FALSE,&nvtxs,(const PetscInt**)&xadj,(const PetscInt**)&adjncy,&flg_row);CHKERRQ(ierr);
660766da6bd7Sstefano_zampini       rcsr = PETSC_TRUE;
6608674ae819SStefano Zampini     }
66099b28b941SStefano Zampini     if (pcbddc->dbg_flag) {
66109b28b941SStefano Zampini       ierr = PetscViewerFlush(pcbddc->dbg_viewer);CHKERRQ(ierr);
6611674ae819SStefano Zampini     }
6612674ae819SStefano Zampini 
6613674ae819SStefano Zampini     /* Setup of Graph */
66144b2aedd3SStefano Zampini     pcbddc->mat_graph->commsizelimit = 0; /* don't use the COMM_SELF variant of the graph */
661514f95afaSStefano Zampini     ierr = PCBDDCGraphSetUp(pcbddc->mat_graph,pcbddc->vertex_size,pcbddc->NeumannBoundariesLocal,pcbddc->DirichletBoundariesLocal,pcbddc->n_ISForDofsLocal,pcbddc->ISForDofsLocal,pcbddc->user_primal_vertices_local);CHKERRQ(ierr);
6616674ae819SStefano Zampini 
66174f1b2e48SStefano Zampini     /* attach info on disconnected subdomains if present */
66184f1b2e48SStefano Zampini     if (pcbddc->n_local_subs) {
66194f1b2e48SStefano Zampini       PetscInt *local_subs;
66204f1b2e48SStefano Zampini 
66214f1b2e48SStefano Zampini       ierr = PetscMalloc1(N,&local_subs);CHKERRQ(ierr);
66224f1b2e48SStefano Zampini       for (i=0;i<pcbddc->n_local_subs;i++) {
66234f1b2e48SStefano Zampini         const PetscInt *idxs;
66244f1b2e48SStefano Zampini         PetscInt       nl,j;
66254f1b2e48SStefano Zampini 
66264f1b2e48SStefano Zampini         ierr = ISGetLocalSize(pcbddc->local_subs[i],&nl);CHKERRQ(ierr);
66274f1b2e48SStefano Zampini         ierr = ISGetIndices(pcbddc->local_subs[i],&idxs);CHKERRQ(ierr);
662871582508SStefano Zampini         for (j=0;j<nl;j++) local_subs[idxs[j]] = i;
66294f1b2e48SStefano Zampini         ierr = ISRestoreIndices(pcbddc->local_subs[i],&idxs);CHKERRQ(ierr);
66304f1b2e48SStefano Zampini       }
66314f1b2e48SStefano Zampini       pcbddc->mat_graph->n_local_subs = pcbddc->n_local_subs;
66324f1b2e48SStefano Zampini       pcbddc->mat_graph->local_subs = local_subs;
66334f1b2e48SStefano Zampini     }
66348af8fcf9SStefano Zampini   }
66354f1b2e48SStefano Zampini 
6636cac5312eSStefano Zampini   if (!pcbddc->graphanalyzed) {
6637674ae819SStefano Zampini     /* Graph's connected components analysis */
6638674ae819SStefano Zampini     ierr = PCBDDCGraphComputeConnectedComponents(pcbddc->mat_graph);CHKERRQ(ierr);
663971582508SStefano Zampini     pcbddc->graphanalyzed = PETSC_TRUE;
66408af8fcf9SStefano Zampini   }
664166da6bd7Sstefano_zampini   if (rcsr) pcbddc->mat_graph->nvtxs_csr = 0;
6642674ae819SStefano Zampini   PetscFunctionReturn(0);
6643674ae819SStefano Zampini }
6644674ae819SStefano Zampini 
66459a7d3425SStefano Zampini PetscErrorCode PCBDDCOrthonormalizeVecs(PetscInt n, Vec vecs[])
66469a7d3425SStefano Zampini {
66479a7d3425SStefano Zampini   PetscInt       i,j;
66489a7d3425SStefano Zampini   PetscScalar    *alphas;
66499a7d3425SStefano Zampini   PetscErrorCode ierr;
66509a7d3425SStefano Zampini 
66519a7d3425SStefano Zampini   PetscFunctionBegin;
6652785e854fSJed Brown   ierr = PetscMalloc1(n,&alphas);CHKERRQ(ierr);
66539a7d3425SStefano Zampini   for (i=0;i<n;i++) {
66549a7d3425SStefano Zampini     ierr = VecNormalize(vecs[i],NULL);CHKERRQ(ierr);
6655669cc0f4SStefano Zampini     ierr = VecMDot(vecs[i],n-i-1,&vecs[i+1],alphas);CHKERRQ(ierr);
6656669cc0f4SStefano Zampini     for (j=0;j<n-i-1;j++) alphas[j] = PetscConj(-alphas[j]);
6657669cc0f4SStefano Zampini     ierr = VecMAXPY(vecs[j],n-i-1,alphas,vecs+i);CHKERRQ(ierr);
66589a7d3425SStefano Zampini   }
66599a7d3425SStefano Zampini   ierr = PetscFree(alphas);CHKERRQ(ierr);
66609a7d3425SStefano Zampini   PetscFunctionReturn(0);
66619a7d3425SStefano Zampini }
66629a7d3425SStefano Zampini 
6663bb360cb4SStefano Zampini PetscErrorCode PCBDDCMatISGetSubassemblingPattern(Mat mat, PetscInt *n_subdomains, PetscInt redprocs, IS* is_sends, PetscBool *have_void)
6664e7931f94SStefano Zampini {
666557de7509SStefano Zampini   Mat            A;
6666e7931f94SStefano Zampini   PetscInt       n_neighs,*neighs,*n_shared,**shared;
6667e7931f94SStefano Zampini   PetscMPIInt    size,rank,color;
666852e5ac9dSStefano Zampini   PetscInt       *xadj,*adjncy;
666952e5ac9dSStefano Zampini   PetscInt       *adjncy_wgt,*v_wgt,*ranks_send_to_idx;
6670bb360cb4SStefano Zampini   PetscInt       im_active,active_procs,N,n,i,j,threshold = 2;
667157de7509SStefano Zampini   PetscInt       void_procs,*procs_candidates = NULL;
667227b6a85dSStefano Zampini   PetscInt       xadj_count,*count;
667327b6a85dSStefano Zampini   PetscBool      ismatis,use_vwgt=PETSC_FALSE;
667427b6a85dSStefano Zampini   PetscSubcomm   psubcomm;
667527b6a85dSStefano Zampini   MPI_Comm       subcomm;
667652e5ac9dSStefano Zampini   PetscErrorCode ierr;
6677a57a6d2fSStefano Zampini 
6678e7931f94SStefano Zampini   PetscFunctionBegin;
667957de7509SStefano Zampini   PetscValidHeaderSpecific(mat,MAT_CLASSID,1);
668057de7509SStefano Zampini   ierr = PetscObjectTypeCompare((PetscObject)mat,MATIS,&ismatis);CHKERRQ(ierr);
6681fbfcfee5SBarry Smith   if (!ismatis) SETERRQ1(PetscObjectComm((PetscObject)mat),PETSC_ERR_SUP,"Cannot use %s on a matrix object which is not of type MATIS",PETSC_FUNCTION_NAME);
668257de7509SStefano Zampini   PetscValidLogicalCollectiveInt(mat,*n_subdomains,2);
668357de7509SStefano Zampini   PetscValidLogicalCollectiveInt(mat,redprocs,3);
668457de7509SStefano Zampini   if (*n_subdomains <=0) SETERRQ1(PetscObjectComm((PetscObject)mat),PETSC_ERR_ARG_WRONG,"Invalid number of subdomains requested %d\n",*n_subdomains);
668557de7509SStefano Zampini 
668657de7509SStefano Zampini   if (have_void) *have_void = PETSC_FALSE;
668757de7509SStefano Zampini   ierr = MPI_Comm_size(PetscObjectComm((PetscObject)mat),&size);CHKERRQ(ierr);
668857de7509SStefano Zampini   ierr = MPI_Comm_rank(PetscObjectComm((PetscObject)mat),&rank);CHKERRQ(ierr);
668957de7509SStefano Zampini   ierr = MatISGetLocalMat(mat,&A);CHKERRQ(ierr);
669057de7509SStefano Zampini   ierr = MatGetLocalSize(A,&n,NULL);CHKERRQ(ierr);
6691bb360cb4SStefano Zampini   im_active = !!n;
669257de7509SStefano Zampini   ierr = MPIU_Allreduce(&im_active,&active_procs,1,MPIU_INT,MPI_SUM,PetscObjectComm((PetscObject)mat));CHKERRQ(ierr);
669357de7509SStefano Zampini   void_procs = size - active_procs;
669457de7509SStefano Zampini   /* get ranks of of non-active processes in mat communicator */
669557de7509SStefano Zampini   if (void_procs) {
669657de7509SStefano Zampini     PetscInt ncand;
669757de7509SStefano Zampini 
669857de7509SStefano Zampini     if (have_void) *have_void = PETSC_TRUE;
669957de7509SStefano Zampini     ierr = PetscMalloc1(size,&procs_candidates);CHKERRQ(ierr);
670057de7509SStefano Zampini     ierr = MPI_Allgather(&im_active,1,MPIU_INT,procs_candidates,1,MPIU_INT,PetscObjectComm((PetscObject)mat));CHKERRQ(ierr);
670157de7509SStefano Zampini     for (i=0,ncand=0;i<size;i++) {
670257de7509SStefano Zampini       if (!procs_candidates[i]) {
670357de7509SStefano Zampini         procs_candidates[ncand++] = i;
670457de7509SStefano Zampini       }
670557de7509SStefano Zampini     }
670657de7509SStefano Zampini     /* force n_subdomains to be not greater that the number of non-active processes */
670757de7509SStefano Zampini     *n_subdomains = PetscMin(void_procs,*n_subdomains);
670857de7509SStefano Zampini   }
670957de7509SStefano Zampini 
6710bb360cb4SStefano Zampini   /* number of subdomains requested greater than active processes or matrix size -> just shift the matrix
671114f0bfb9SStefano Zampini      number of subdomains requested 1 -> send to master or first candidate in voids  */
6712bb360cb4SStefano Zampini   ierr = MatGetSize(mat,&N,NULL);CHKERRQ(ierr);
6713bb360cb4SStefano Zampini   if (active_procs < *n_subdomains || *n_subdomains == 1 || N <= *n_subdomains) {
671414f0bfb9SStefano Zampini     PetscInt issize,isidx,dest;
671514f0bfb9SStefano Zampini     if (*n_subdomains == 1) dest = 0;
671614f0bfb9SStefano Zampini     else dest = rank;
671757de7509SStefano Zampini     if (im_active) {
671857de7509SStefano Zampini       issize = 1;
671957de7509SStefano Zampini       if (procs_candidates) { /* shift the pattern on non-active candidates (if any) */
672014f0bfb9SStefano Zampini         isidx = procs_candidates[dest];
672157de7509SStefano Zampini       } else {
672214f0bfb9SStefano Zampini         isidx = dest;
672357de7509SStefano Zampini       }
672457de7509SStefano Zampini     } else {
672557de7509SStefano Zampini       issize = 0;
672657de7509SStefano Zampini       isidx = -1;
672757de7509SStefano Zampini     }
6728bb360cb4SStefano Zampini     if (*n_subdomains != 1) *n_subdomains = active_procs;
672957de7509SStefano Zampini     ierr = ISCreateGeneral(PetscObjectComm((PetscObject)mat),issize,&isidx,PETSC_COPY_VALUES,is_sends);CHKERRQ(ierr);
6730daf8a457SStefano Zampini     ierr = PetscFree(procs_candidates);CHKERRQ(ierr);
673157de7509SStefano Zampini     PetscFunctionReturn(0);
673257de7509SStefano Zampini   }
6733c5929fdfSBarry Smith   ierr = PetscOptionsGetBool(NULL,NULL,"-matis_partitioning_use_vwgt",&use_vwgt,NULL);CHKERRQ(ierr);
6734c5929fdfSBarry Smith   ierr = PetscOptionsGetInt(NULL,NULL,"-matis_partitioning_threshold",&threshold,NULL);CHKERRQ(ierr);
673527b6a85dSStefano Zampini   threshold = PetscMax(threshold,2);
6736e7931f94SStefano Zampini 
6737e7931f94SStefano Zampini   /* Get info on mapping */
67383bbff08aSStefano Zampini   ierr = ISLocalToGlobalMappingGetInfo(mat->rmap->mapping,&n_neighs,&neighs,&n_shared,&shared);CHKERRQ(ierr);
6739e7931f94SStefano Zampini 
6740e7931f94SStefano Zampini   /* build local CSR graph of subdomains' connectivity */
6741785e854fSJed Brown   ierr = PetscMalloc1(2,&xadj);CHKERRQ(ierr);
6742e7931f94SStefano Zampini   xadj[0] = 0;
6743e7931f94SStefano Zampini   xadj[1] = PetscMax(n_neighs-1,0);
6744785e854fSJed Brown   ierr = PetscMalloc1(xadj[1],&adjncy);CHKERRQ(ierr);
6745785e854fSJed Brown   ierr = PetscMalloc1(xadj[1],&adjncy_wgt);CHKERRQ(ierr);
6746bb360cb4SStefano Zampini   ierr = PetscCalloc1(n,&count);CHKERRQ(ierr);
674727b6a85dSStefano Zampini   for (i=1;i<n_neighs;i++)
674827b6a85dSStefano Zampini     for (j=0;j<n_shared[i];j++)
674927b6a85dSStefano Zampini       count[shared[i][j]] += 1;
6750e7931f94SStefano Zampini 
675127b6a85dSStefano Zampini   xadj_count = 0;
67522b510759SStefano Zampini   for (i=1;i<n_neighs;i++) {
675327b6a85dSStefano Zampini     for (j=0;j<n_shared[i];j++) {
675427b6a85dSStefano Zampini       if (count[shared[i][j]] < threshold) {
6755d023bfaeSStefano Zampini         adjncy[xadj_count] = neighs[i];
6756d023bfaeSStefano Zampini         adjncy_wgt[xadj_count] = n_shared[i];
6757d023bfaeSStefano Zampini         xadj_count++;
675827b6a85dSStefano Zampini         break;
675927b6a85dSStefano Zampini       }
6760e7931f94SStefano Zampini     }
6761e7931f94SStefano Zampini   }
6762d023bfaeSStefano Zampini   xadj[1] = xadj_count;
676327b6a85dSStefano Zampini   ierr = PetscFree(count);CHKERRQ(ierr);
67643bbff08aSStefano Zampini   ierr = ISLocalToGlobalMappingRestoreInfo(mat->rmap->mapping,&n_neighs,&neighs,&n_shared,&shared);CHKERRQ(ierr);
6765e7931f94SStefano Zampini   ierr = PetscSortIntWithArray(xadj[1],adjncy,adjncy_wgt);CHKERRQ(ierr);
6766e7931f94SStefano Zampini 
67673837a79fSStefano Zampini   ierr = PetscMalloc1(1,&ranks_send_to_idx);CHKERRQ(ierr);
6768e7931f94SStefano Zampini 
676927b6a85dSStefano Zampini   /* Restrict work on active processes only */
677027b6a85dSStefano Zampini   ierr = PetscMPIIntCast(im_active,&color);CHKERRQ(ierr);
677127b6a85dSStefano Zampini   if (void_procs) {
677227b6a85dSStefano Zampini     ierr = PetscSubcommCreate(PetscObjectComm((PetscObject)mat),&psubcomm);CHKERRQ(ierr);
677327b6a85dSStefano Zampini     ierr = PetscSubcommSetNumber(psubcomm,2);CHKERRQ(ierr); /* 2 groups, active process and not active processes */
677427b6a85dSStefano Zampini     ierr = PetscSubcommSetTypeGeneral(psubcomm,color,rank);CHKERRQ(ierr);
677527b6a85dSStefano Zampini     subcomm = PetscSubcommChild(psubcomm);
677627b6a85dSStefano Zampini   } else {
677727b6a85dSStefano Zampini     psubcomm = NULL;
677827b6a85dSStefano Zampini     subcomm = PetscObjectComm((PetscObject)mat);
677927b6a85dSStefano Zampini   }
678027b6a85dSStefano Zampini 
678127b6a85dSStefano Zampini   v_wgt = NULL;
678227b6a85dSStefano Zampini   if (!color) {
6783e7931f94SStefano Zampini     ierr = PetscFree(xadj);CHKERRQ(ierr);
6784e7931f94SStefano Zampini     ierr = PetscFree(adjncy);CHKERRQ(ierr);
6785e7931f94SStefano Zampini     ierr = PetscFree(adjncy_wgt);CHKERRQ(ierr);
6786c8587f34SStefano Zampini   } else {
678752e5ac9dSStefano Zampini     Mat             subdomain_adj;
678852e5ac9dSStefano Zampini     IS              new_ranks,new_ranks_contig;
678952e5ac9dSStefano Zampini     MatPartitioning partitioner;
679027b6a85dSStefano Zampini     PetscInt        rstart=0,rend=0;
679152e5ac9dSStefano Zampini     PetscInt        *is_indices,*oldranks;
679257de7509SStefano Zampini     PetscMPIInt     size;
6793b0c7d250SStefano Zampini     PetscBool       aggregate;
6794b0c7d250SStefano Zampini 
679527b6a85dSStefano Zampini     ierr = MPI_Comm_size(subcomm,&size);CHKERRQ(ierr);
679627b6a85dSStefano Zampini     if (void_procs) {
679727b6a85dSStefano Zampini       PetscInt prank = rank;
6798785e854fSJed Brown       ierr = PetscMalloc1(size,&oldranks);CHKERRQ(ierr);
679927b6a85dSStefano Zampini       ierr = MPI_Allgather(&prank,1,MPIU_INT,oldranks,1,MPIU_INT,subcomm);CHKERRQ(ierr);
6800e7931f94SStefano Zampini       for (i=0;i<xadj[1];i++) {
6801e7931f94SStefano Zampini         ierr = PetscFindInt(adjncy[i],size,oldranks,&adjncy[i]);CHKERRQ(ierr);
6802c8587f34SStefano Zampini       }
6803e7931f94SStefano Zampini       ierr = PetscSortIntWithArray(xadj[1],adjncy,adjncy_wgt);CHKERRQ(ierr);
680427b6a85dSStefano Zampini     } else {
680527b6a85dSStefano Zampini       oldranks = NULL;
680627b6a85dSStefano Zampini     }
6807b0c7d250SStefano Zampini     aggregate = ((redprocs > 0 && redprocs < size) ? PETSC_TRUE : PETSC_FALSE);
680827b6a85dSStefano Zampini     if (aggregate) { /* TODO: all this part could be made more efficient */
6809b0c7d250SStefano Zampini       PetscInt    lrows,row,ncols,*cols;
6810b0c7d250SStefano Zampini       PetscMPIInt nrank;
6811b0c7d250SStefano Zampini       PetscScalar *vals;
6812b0c7d250SStefano Zampini 
681327b6a85dSStefano Zampini       ierr = MPI_Comm_rank(subcomm,&nrank);CHKERRQ(ierr);
6814b0c7d250SStefano Zampini       lrows = 0;
6815b0c7d250SStefano Zampini       if (nrank<redprocs) {
6816b0c7d250SStefano Zampini         lrows = size/redprocs;
6817b0c7d250SStefano Zampini         if (nrank<size%redprocs) lrows++;
6818b0c7d250SStefano Zampini       }
681927b6a85dSStefano Zampini       ierr = MatCreateAIJ(subcomm,lrows,lrows,size,size,50,NULL,50,NULL,&subdomain_adj);CHKERRQ(ierr);
6820b0c7d250SStefano Zampini       ierr = MatGetOwnershipRange(subdomain_adj,&rstart,&rend);CHKERRQ(ierr);
6821b0c7d250SStefano Zampini       ierr = MatSetOption(subdomain_adj,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_FALSE);CHKERRQ(ierr);
6822b0c7d250SStefano Zampini       ierr = MatSetOption(subdomain_adj,MAT_NEW_NONZERO_ALLOCATION_ERR,PETSC_FALSE);CHKERRQ(ierr);
6823b0c7d250SStefano Zampini       row = nrank;
6824b0c7d250SStefano Zampini       ncols = xadj[1]-xadj[0];
6825b0c7d250SStefano Zampini       cols = adjncy;
6826b0c7d250SStefano Zampini       ierr = PetscMalloc1(ncols,&vals);CHKERRQ(ierr);
6827b0c7d250SStefano Zampini       for (i=0;i<ncols;i++) vals[i] = adjncy_wgt[i];
6828b0c7d250SStefano Zampini       ierr = MatSetValues(subdomain_adj,1,&row,ncols,cols,vals,INSERT_VALUES);CHKERRQ(ierr);
6829b0c7d250SStefano Zampini       ierr = MatAssemblyBegin(subdomain_adj,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
6830b0c7d250SStefano Zampini       ierr = MatAssemblyEnd(subdomain_adj,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
683152e5ac9dSStefano Zampini       ierr = PetscFree(xadj);CHKERRQ(ierr);
683252e5ac9dSStefano Zampini       ierr = PetscFree(adjncy);CHKERRQ(ierr);
683352e5ac9dSStefano Zampini       ierr = PetscFree(adjncy_wgt);CHKERRQ(ierr);
6834b0c7d250SStefano Zampini       ierr = PetscFree(vals);CHKERRQ(ierr);
683527b6a85dSStefano Zampini       if (use_vwgt) {
683627b6a85dSStefano Zampini         Vec               v;
683727b6a85dSStefano Zampini         const PetscScalar *array;
683827b6a85dSStefano Zampini         PetscInt          nl;
683927b6a85dSStefano Zampini 
684027b6a85dSStefano Zampini         ierr = MatCreateVecs(subdomain_adj,&v,NULL);CHKERRQ(ierr);
6841bb360cb4SStefano Zampini         ierr = VecSetValue(v,row,(PetscScalar)n,INSERT_VALUES);CHKERRQ(ierr);
684227b6a85dSStefano Zampini         ierr = VecAssemblyBegin(v);CHKERRQ(ierr);
684327b6a85dSStefano Zampini         ierr = VecAssemblyEnd(v);CHKERRQ(ierr);
684427b6a85dSStefano Zampini         ierr = VecGetLocalSize(v,&nl);CHKERRQ(ierr);
684527b6a85dSStefano Zampini         ierr = VecGetArrayRead(v,&array);CHKERRQ(ierr);
684627b6a85dSStefano Zampini         ierr = PetscMalloc1(nl,&v_wgt);CHKERRQ(ierr);
684722db5ddcSStefano Zampini         for (i=0;i<nl;i++) v_wgt[i] = (PetscInt)PetscRealPart(array[i]);
684827b6a85dSStefano Zampini         ierr = VecRestoreArrayRead(v,&array);CHKERRQ(ierr);
684927b6a85dSStefano Zampini         ierr = VecDestroy(&v);CHKERRQ(ierr);
685027b6a85dSStefano Zampini       }
6851b0c7d250SStefano Zampini     } else {
685227b6a85dSStefano Zampini       ierr = MatCreateMPIAdj(subcomm,1,(PetscInt)size,xadj,adjncy,adjncy_wgt,&subdomain_adj);CHKERRQ(ierr);
685327b6a85dSStefano Zampini       if (use_vwgt) {
685427b6a85dSStefano Zampini         ierr = PetscMalloc1(1,&v_wgt);CHKERRQ(ierr);
6855bb360cb4SStefano Zampini         v_wgt[0] = n;
685627b6a85dSStefano Zampini       }
6857b0c7d250SStefano Zampini     }
685822b6e8a2SStefano Zampini     /* ierr = MatView(subdomain_adj,0);CHKERRQ(ierr); */
6859e7931f94SStefano Zampini 
6860e7931f94SStefano Zampini     /* Partition */
686127b6a85dSStefano Zampini     ierr = MatPartitioningCreate(subcomm,&partitioner);CHKERRQ(ierr);
6862e7931f94SStefano Zampini     ierr = MatPartitioningSetAdjacency(partitioner,subdomain_adj);CHKERRQ(ierr);
686327b6a85dSStefano Zampini     if (v_wgt) {
6864e7931f94SStefano Zampini       ierr = MatPartitioningSetVertexWeights(partitioner,v_wgt);CHKERRQ(ierr);
6865c8587f34SStefano Zampini     }
686657de7509SStefano Zampini     *n_subdomains = PetscMin((PetscInt)size,*n_subdomains);
686757de7509SStefano Zampini     ierr = MatPartitioningSetNParts(partitioner,*n_subdomains);CHKERRQ(ierr);
6868e7931f94SStefano Zampini     ierr = MatPartitioningSetFromOptions(partitioner);CHKERRQ(ierr);
6869e7931f94SStefano Zampini     ierr = MatPartitioningApply(partitioner,&new_ranks);CHKERRQ(ierr);
687022b6e8a2SStefano Zampini     /* ierr = MatPartitioningView(partitioner,0);CHKERRQ(ierr); */
6871e7931f94SStefano Zampini 
687252e5ac9dSStefano Zampini     /* renumber new_ranks to avoid "holes" in new set of processors */
68736583bcc1SStefano Zampini     ierr = ISRenumber(new_ranks,NULL,NULL,&new_ranks_contig);CHKERRQ(ierr);
687452e5ac9dSStefano Zampini     ierr = ISDestroy(&new_ranks);CHKERRQ(ierr);
687552e5ac9dSStefano Zampini     ierr = ISGetIndices(new_ranks_contig,(const PetscInt**)&is_indices);CHKERRQ(ierr);
687657de7509SStefano Zampini     if (!aggregate) {
687757de7509SStefano Zampini       if (procs_candidates) { /* shift the pattern on non-active candidates (if any) */
687827b6a85dSStefano Zampini #if defined(PETSC_USE_DEBUG)
687927b6a85dSStefano Zampini         if (!oldranks) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"This should not happen");
688027b6a85dSStefano Zampini #endif
688157de7509SStefano Zampini         ranks_send_to_idx[0] = procs_candidates[oldranks[is_indices[0]]];
688227b6a85dSStefano Zampini       } else if (oldranks) {
6883b0c7d250SStefano Zampini         ranks_send_to_idx[0] = oldranks[is_indices[0]];
688427b6a85dSStefano Zampini       } else {
688527b6a85dSStefano Zampini         ranks_send_to_idx[0] = is_indices[0];
688657de7509SStefano Zampini       }
688728143c3dSStefano Zampini     } else {
68887fb8a5e4SKarl Rupp       PetscInt    idx = 0;
6889b0c7d250SStefano Zampini       PetscMPIInt tag;
6890b0c7d250SStefano Zampini       MPI_Request *reqs;
6891b0c7d250SStefano Zampini 
6892b0c7d250SStefano Zampini       ierr = PetscObjectGetNewTag((PetscObject)subdomain_adj,&tag);CHKERRQ(ierr);
6893b0c7d250SStefano Zampini       ierr = PetscMalloc1(rend-rstart,&reqs);CHKERRQ(ierr);
6894b0c7d250SStefano Zampini       for (i=rstart;i<rend;i++) {
689527b6a85dSStefano Zampini         ierr = MPI_Isend(is_indices+i-rstart,1,MPIU_INT,i,tag,subcomm,&reqs[i-rstart]);CHKERRQ(ierr);
689628143c3dSStefano Zampini       }
68977fb8a5e4SKarl Rupp       ierr = MPI_Recv(&idx,1,MPIU_INT,MPI_ANY_SOURCE,tag,subcomm,MPI_STATUS_IGNORE);CHKERRQ(ierr);
6898b0c7d250SStefano Zampini       ierr = MPI_Waitall(rend-rstart,reqs,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
6899b0c7d250SStefano Zampini       ierr = PetscFree(reqs);CHKERRQ(ierr);
690057de7509SStefano Zampini       if (procs_candidates) { /* shift the pattern on non-active candidates (if any) */
690127b6a85dSStefano Zampini #if defined(PETSC_USE_DEBUG)
690227b6a85dSStefano Zampini         if (!oldranks) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"This should not happen");
690327b6a85dSStefano Zampini #endif
69047fb8a5e4SKarl Rupp         ranks_send_to_idx[0] = procs_candidates[oldranks[idx]];
690527b6a85dSStefano Zampini       } else if (oldranks) {
69067fb8a5e4SKarl Rupp         ranks_send_to_idx[0] = oldranks[idx];
690727b6a85dSStefano Zampini       } else {
69087fb8a5e4SKarl Rupp         ranks_send_to_idx[0] = idx;
6909e7931f94SStefano Zampini       }
691057de7509SStefano Zampini     }
691152e5ac9dSStefano Zampini     ierr = ISRestoreIndices(new_ranks_contig,(const PetscInt**)&is_indices);CHKERRQ(ierr);
6912e7931f94SStefano Zampini     /* clean up */
6913e7931f94SStefano Zampini     ierr = PetscFree(oldranks);CHKERRQ(ierr);
691452e5ac9dSStefano Zampini     ierr = ISDestroy(&new_ranks_contig);CHKERRQ(ierr);
6915e7931f94SStefano Zampini     ierr = MatDestroy(&subdomain_adj);CHKERRQ(ierr);
6916e7931f94SStefano Zampini     ierr = MatPartitioningDestroy(&partitioner);CHKERRQ(ierr);
6917e7931f94SStefano Zampini   }
691827b6a85dSStefano Zampini   ierr = PetscSubcommDestroy(&psubcomm);CHKERRQ(ierr);
691957de7509SStefano Zampini   ierr = PetscFree(procs_candidates);CHKERRQ(ierr);
6920e7931f94SStefano Zampini 
6921e7931f94SStefano Zampini   /* assemble parallel IS for sends */
6922e7931f94SStefano Zampini   i = 1;
692327b6a85dSStefano Zampini   if (!color) i=0;
692457de7509SStefano Zampini   ierr = ISCreateGeneral(PetscObjectComm((PetscObject)mat),i,ranks_send_to_idx,PETSC_OWN_POINTER,is_sends);CHKERRQ(ierr);
6925e7931f94SStefano Zampini   PetscFunctionReturn(0);
6926e7931f94SStefano Zampini }
6927e7931f94SStefano Zampini 
/* Integer tags identifying the storage type of a local matrix.
   PCBDDCMatISSubassemble() in this file writes MATDENSE_PRIVATE (cast to PetscInt)
   as the first entry of the index buffer it sends to other processes; on the
   receiving side it compares the first entry of each received buffer against these
   tags and switches on the result to choose the type of the new local matrix.
   Because the numeric values are exchanged between processes, they have to be
   the same on every rank. */
6928e7931f94SStefano Zampini typedef enum {MATDENSE_PRIVATE=0,MATAIJ_PRIVATE,MATBAIJ_PRIVATE,MATSBAIJ_PRIVATE}MatTypePrivate;
6929e7931f94SStefano Zampini 
69301e0482f5SStefano Zampini PetscErrorCode PCBDDCMatISSubassemble(Mat mat, IS is_sends, PetscInt n_subdomains, PetscBool restrict_comm, PetscBool restrict_full, PetscBool reuse, Mat *mat_n, PetscInt nis, IS isarray[], PetscInt nvecs, Vec nnsp_vec[])
6931e7931f94SStefano Zampini {
693270cf5478SStefano Zampini   Mat                    local_mat;
6933e7931f94SStefano Zampini   IS                     is_sends_internal;
69349d30be91SStefano Zampini   PetscInt               rows,cols,new_local_rows;
69351ae86dd6SStefano Zampini   PetscInt               i,bs,buf_size_idxs,buf_size_idxs_is,buf_size_vals,buf_size_vecs;
69369d30be91SStefano Zampini   PetscBool              ismatis,isdense,newisdense,destroy_mat;
6937e7931f94SStefano Zampini   ISLocalToGlobalMapping l2gmap;
6938e7931f94SStefano Zampini   PetscInt*              l2gmap_indices;
6939e7931f94SStefano Zampini   const PetscInt*        is_indices;
6940e7931f94SStefano Zampini   MatType                new_local_type;
6941e7931f94SStefano Zampini   /* buffers */
6942e7931f94SStefano Zampini   PetscInt               *ptr_idxs,*send_buffer_idxs,*recv_buffer_idxs;
694328143c3dSStefano Zampini   PetscInt               *ptr_idxs_is,*send_buffer_idxs_is,*recv_buffer_idxs_is;
69449d30be91SStefano Zampini   PetscInt               *recv_buffer_idxs_local;
6945e7931f94SStefano Zampini   PetscScalar            *ptr_vals,*send_buffer_vals,*recv_buffer_vals;
69461ae86dd6SStefano Zampini   PetscScalar            *ptr_vecs,*send_buffer_vecs,*recv_buffer_vecs;
6947e7931f94SStefano Zampini   /* MPI */
694828143c3dSStefano Zampini   MPI_Comm               comm,comm_n;
694928143c3dSStefano Zampini   PetscSubcomm           subcomm;
6950e7931f94SStefano Zampini   PetscMPIInt            n_sends,n_recvs,commsize;
695128143c3dSStefano Zampini   PetscMPIInt            *iflags,*ilengths_idxs,*ilengths_vals,*ilengths_idxs_is;
695228143c3dSStefano Zampini   PetscMPIInt            *onodes,*onodes_is,*olengths_idxs,*olengths_idxs_is,*olengths_vals;
69531ae86dd6SStefano Zampini   PetscMPIInt            len,tag_idxs,tag_idxs_is,tag_vals,tag_vecs,source_dest;
69541ae86dd6SStefano Zampini   MPI_Request            *send_req_idxs,*send_req_idxs_is,*send_req_vals,*send_req_vecs;
69551ae86dd6SStefano Zampini   MPI_Request            *recv_req_idxs,*recv_req_idxs_is,*recv_req_vals,*recv_req_vecs;
6956e7931f94SStefano Zampini   PetscErrorCode         ierr;
6957e7931f94SStefano Zampini 
6958e7931f94SStefano Zampini   PetscFunctionBegin;
695957de7509SStefano Zampini   PetscValidHeaderSpecific(mat,MAT_CLASSID,1);
6960e7931f94SStefano Zampini   ierr = PetscObjectTypeCompare((PetscObject)mat,MATIS,&ismatis);CHKERRQ(ierr);
6961fbfcfee5SBarry Smith   if (!ismatis) SETERRQ1(PetscObjectComm((PetscObject)mat),PETSC_ERR_SUP,"Cannot use %s on a matrix object which is not of type MATIS",PETSC_FUNCTION_NAME);
696257de7509SStefano Zampini   PetscValidLogicalCollectiveInt(mat,n_subdomains,3);
696357de7509SStefano Zampini   PetscValidLogicalCollectiveBool(mat,restrict_comm,4);
696457de7509SStefano Zampini   PetscValidLogicalCollectiveBool(mat,restrict_full,5);
696557de7509SStefano Zampini   PetscValidLogicalCollectiveBool(mat,reuse,6);
696657de7509SStefano Zampini   PetscValidLogicalCollectiveInt(mat,nis,8);
69671ae86dd6SStefano Zampini   PetscValidLogicalCollectiveInt(mat,nvecs,10);
69681ae86dd6SStefano Zampini   if (nvecs) {
69691ae86dd6SStefano Zampini     if (nvecs > 1) SETERRQ(PetscObjectComm((PetscObject)mat),PETSC_ERR_SUP,"Just 1 vector supported");
69701ae86dd6SStefano Zampini     PetscValidHeaderSpecific(nnsp_vec[0],VEC_CLASSID,11);
69711ae86dd6SStefano Zampini   }
697257de7509SStefano Zampini   /* further checks */
6973e7931f94SStefano Zampini   ierr = MatISGetLocalMat(mat,&local_mat);CHKERRQ(ierr);
6974e7931f94SStefano Zampini   ierr = PetscObjectTypeCompare((PetscObject)local_mat,MATSEQDENSE,&isdense);CHKERRQ(ierr);
6975e7931f94SStefano Zampini   if (!isdense) SETERRQ(PetscObjectComm((PetscObject)mat),PETSC_ERR_SUP,"Currently cannot subassemble MATIS when local matrix type is not of type SEQDENSE");
6976e7931f94SStefano Zampini   ierr = MatGetSize(local_mat,&rows,&cols);CHKERRQ(ierr);
6977e7931f94SStefano Zampini   if (rows != cols) SETERRQ(PetscObjectComm((PetscObject)mat),PETSC_ERR_SUP,"Local MATIS matrices should be square");
697857de7509SStefano Zampini   if (reuse && *mat_n) {
697970cf5478SStefano Zampini     PetscInt mrows,mcols,mnrows,mncols;
698057de7509SStefano Zampini     PetscValidHeaderSpecific(*mat_n,MAT_CLASSID,7);
698170cf5478SStefano Zampini     ierr = PetscObjectTypeCompare((PetscObject)*mat_n,MATIS,&ismatis);CHKERRQ(ierr);
698228143c3dSStefano Zampini     if (!ismatis) SETERRQ(PetscObjectComm((PetscObject)*mat_n),PETSC_ERR_SUP,"Cannot reuse a matrix which is not of type MATIS");
698370cf5478SStefano Zampini     ierr = MatGetSize(mat,&mrows,&mcols);CHKERRQ(ierr);
698470cf5478SStefano Zampini     ierr = MatGetSize(*mat_n,&mnrows,&mncols);CHKERRQ(ierr);
698570cf5478SStefano Zampini     if (mrows != mnrows) SETERRQ2(PetscObjectComm((PetscObject)mat),PETSC_ERR_SUP,"Cannot reuse matrix! Wrong number of rows %D != %D",mrows,mnrows);
698670cf5478SStefano Zampini     if (mcols != mncols) SETERRQ2(PetscObjectComm((PetscObject)mat),PETSC_ERR_SUP,"Cannot reuse matrix! Wrong number of cols %D != %D",mcols,mncols);
698770cf5478SStefano Zampini   }
6988e7931f94SStefano Zampini   ierr = MatGetBlockSize(local_mat,&bs);CHKERRQ(ierr);
6989e7931f94SStefano Zampini   PetscValidLogicalCollectiveInt(mat,bs,0);
699057de7509SStefano Zampini 
6991e7931f94SStefano Zampini   /* prepare IS for sending if not provided */
6992e7931f94SStefano Zampini   if (!is_sends) {
699328143c3dSStefano Zampini     if (!n_subdomains) SETERRQ(PetscObjectComm((PetscObject)mat),PETSC_ERR_SUP,"You should specify either an IS or a target number of subdomains");
6994bb360cb4SStefano Zampini     ierr = PCBDDCMatISGetSubassemblingPattern(mat,&n_subdomains,0,&is_sends_internal,NULL);CHKERRQ(ierr);
6995c8587f34SStefano Zampini   } else {
6996e7931f94SStefano Zampini     ierr = PetscObjectReference((PetscObject)is_sends);CHKERRQ(ierr);
6997e7931f94SStefano Zampini     is_sends_internal = is_sends;
6998c8587f34SStefano Zampini   }
6999e7931f94SStefano Zampini 
7000e7931f94SStefano Zampini   /* get comm */
7001a316fed8SStefano Zampini   ierr = PetscObjectGetComm((PetscObject)mat,&comm);CHKERRQ(ierr);
7002e7931f94SStefano Zampini 
7003e7931f94SStefano Zampini   /* compute number of sends */
7004e7931f94SStefano Zampini   ierr = ISGetLocalSize(is_sends_internal,&i);CHKERRQ(ierr);
7005e7931f94SStefano Zampini   ierr = PetscMPIIntCast(i,&n_sends);CHKERRQ(ierr);
7006e7931f94SStefano Zampini 
7007e7931f94SStefano Zampini   /* compute number of receives */
7008e7931f94SStefano Zampini   ierr = MPI_Comm_size(comm,&commsize);CHKERRQ(ierr);
7009785e854fSJed Brown   ierr = PetscMalloc1(commsize,&iflags);CHKERRQ(ierr);
7010e7931f94SStefano Zampini   ierr = PetscMemzero(iflags,commsize*sizeof(*iflags));CHKERRQ(ierr);
7011e7931f94SStefano Zampini   ierr = ISGetIndices(is_sends_internal,&is_indices);CHKERRQ(ierr);
7012e7931f94SStefano Zampini   for (i=0;i<n_sends;i++) iflags[is_indices[i]] = 1;
7013e7931f94SStefano Zampini   ierr = PetscGatherNumberOfMessages(comm,iflags,NULL,&n_recvs);CHKERRQ(ierr);
7014e7931f94SStefano Zampini   ierr = PetscFree(iflags);CHKERRQ(ierr);
7015e7931f94SStefano Zampini 
701628143c3dSStefano Zampini   /* restrict comm if requested */
701728143c3dSStefano Zampini   subcomm = 0;
701828143c3dSStefano Zampini   destroy_mat = PETSC_FALSE;
701928143c3dSStefano Zampini   if (restrict_comm) {
7020779c1cceSStefano Zampini     PetscMPIInt color,subcommsize;
7021779c1cceSStefano Zampini 
702228143c3dSStefano Zampini     color = 0;
702353a05cb3SStefano Zampini     if (restrict_full) {
702453a05cb3SStefano Zampini       if (!n_recvs) color = 1; /* processes not receiving anything will not partecipate in new comm (full restriction) */
702553a05cb3SStefano Zampini     } else {
702653a05cb3SStefano Zampini       if (!n_recvs && n_sends) color = 1; /* just those processes that are sending but not receiving anything will not partecipate in new comm */
702753a05cb3SStefano Zampini     }
7028b2566f29SBarry Smith     ierr = MPIU_Allreduce(&color,&subcommsize,1,MPI_INT,MPI_SUM,comm);CHKERRQ(ierr);
702928143c3dSStefano Zampini     subcommsize = commsize - subcommsize;
703028143c3dSStefano Zampini     /* check if reuse has been requested */
703157de7509SStefano Zampini     if (reuse) {
703228143c3dSStefano Zampini       if (*mat_n) {
703328143c3dSStefano Zampini         PetscMPIInt subcommsize2;
703428143c3dSStefano Zampini         ierr = MPI_Comm_size(PetscObjectComm((PetscObject)*mat_n),&subcommsize2);CHKERRQ(ierr);
703528143c3dSStefano Zampini         if (subcommsize != subcommsize2) SETERRQ2(PetscObjectComm((PetscObject)*mat_n),PETSC_ERR_PLIB,"Cannot reuse matrix! wrong subcomm size %d != %d",subcommsize,subcommsize2);
703628143c3dSStefano Zampini         comm_n = PetscObjectComm((PetscObject)*mat_n);
703728143c3dSStefano Zampini       } else {
703828143c3dSStefano Zampini         comm_n = PETSC_COMM_SELF;
703928143c3dSStefano Zampini       }
704028143c3dSStefano Zampini     } else { /* MAT_INITIAL_MATRIX */
7041779c1cceSStefano Zampini       PetscMPIInt rank;
7042779c1cceSStefano Zampini 
7043779c1cceSStefano Zampini       ierr = MPI_Comm_rank(comm,&rank);CHKERRQ(ierr);
704428143c3dSStefano Zampini       ierr = PetscSubcommCreate(comm,&subcomm);CHKERRQ(ierr);
704528143c3dSStefano Zampini       ierr = PetscSubcommSetNumber(subcomm,2);CHKERRQ(ierr);
704628143c3dSStefano Zampini       ierr = PetscSubcommSetTypeGeneral(subcomm,color,rank);CHKERRQ(ierr);
7047306c2d5bSBarry Smith       comm_n = PetscSubcommChild(subcomm);
704828143c3dSStefano Zampini     }
704928143c3dSStefano Zampini     /* flag to destroy *mat_n if not significative */
705028143c3dSStefano Zampini     if (color) destroy_mat = PETSC_TRUE;
705128143c3dSStefano Zampini   } else {
705228143c3dSStefano Zampini     comm_n = comm;
705328143c3dSStefano Zampini   }
705428143c3dSStefano Zampini 
7055e7931f94SStefano Zampini   /* prepare send/receive buffers */
7056785e854fSJed Brown   ierr = PetscMalloc1(commsize,&ilengths_idxs);CHKERRQ(ierr);
7057e7931f94SStefano Zampini   ierr = PetscMemzero(ilengths_idxs,commsize*sizeof(*ilengths_idxs));CHKERRQ(ierr);
7058785e854fSJed Brown   ierr = PetscMalloc1(commsize,&ilengths_vals);CHKERRQ(ierr);
7059e7931f94SStefano Zampini   ierr = PetscMemzero(ilengths_vals,commsize*sizeof(*ilengths_vals));CHKERRQ(ierr);
706028143c3dSStefano Zampini   if (nis) {
7061854ce69bSBarry Smith     ierr = PetscCalloc1(commsize,&ilengths_idxs_is);CHKERRQ(ierr);
706228143c3dSStefano Zampini   }
7063e7931f94SStefano Zampini 
706428143c3dSStefano Zampini   /* Get data from local matrices */
70656c4ed002SBarry Smith   if (!isdense) SETERRQ(PetscObjectComm((PetscObject)mat),PETSC_ERR_SUP,"Subassembling of AIJ local matrices not yet implemented");
7066e7931f94SStefano Zampini     /* TODO: See below some guidelines on how to prepare the local buffers */
7067e7931f94SStefano Zampini     /*
7068e7931f94SStefano Zampini        send_buffer_vals should contain the raw values of the local matrix
7069e7931f94SStefano Zampini        send_buffer_idxs should contain:
7070e7931f94SStefano Zampini        - MatType_PRIVATE type
7071e7931f94SStefano Zampini        - PetscInt        size_of_l2gmap
7072e7931f94SStefano Zampini        - PetscInt        global_row_indices[size_of_l2gmap]
7073e7931f94SStefano Zampini        - PetscInt        all_other_info_which_is_needed_to_compute_preallocation_and_set_values
7074e7931f94SStefano Zampini     */
70756c4ed002SBarry Smith   else {
7076e7931f94SStefano Zampini     ierr = MatDenseGetArray(local_mat,&send_buffer_vals);CHKERRQ(ierr);
70773bbff08aSStefano Zampini     ierr = ISLocalToGlobalMappingGetSize(mat->rmap->mapping,&i);CHKERRQ(ierr);
7078854ce69bSBarry Smith     ierr = PetscMalloc1(i+2,&send_buffer_idxs);CHKERRQ(ierr);
7079e7931f94SStefano Zampini     send_buffer_idxs[0] = (PetscInt)MATDENSE_PRIVATE;
7080e7931f94SStefano Zampini     send_buffer_idxs[1] = i;
70813bbff08aSStefano Zampini     ierr = ISLocalToGlobalMappingGetIndices(mat->rmap->mapping,(const PetscInt**)&ptr_idxs);CHKERRQ(ierr);
7082e7931f94SStefano Zampini     ierr = PetscMemcpy(&send_buffer_idxs[2],ptr_idxs,i*sizeof(PetscInt));CHKERRQ(ierr);
70833bbff08aSStefano Zampini     ierr = ISLocalToGlobalMappingRestoreIndices(mat->rmap->mapping,(const PetscInt**)&ptr_idxs);CHKERRQ(ierr);
7084e7931f94SStefano Zampini     ierr = PetscMPIIntCast(i,&len);CHKERRQ(ierr);
7085e7931f94SStefano Zampini     for (i=0;i<n_sends;i++) {
7086e7931f94SStefano Zampini       ilengths_vals[is_indices[i]] = len*len;
7087e7931f94SStefano Zampini       ilengths_idxs[is_indices[i]] = len+2;
7088c8587f34SStefano Zampini     }
7089c8587f34SStefano Zampini   }
7090e7931f94SStefano Zampini   ierr = PetscGatherMessageLengths2(comm,n_sends,n_recvs,ilengths_idxs,ilengths_vals,&onodes,&olengths_idxs,&olengths_vals);CHKERRQ(ierr);
709128143c3dSStefano Zampini   /* additional is (if any) */
709228143c3dSStefano Zampini   if (nis) {
709328143c3dSStefano Zampini     PetscMPIInt psum;
709428143c3dSStefano Zampini     PetscInt j;
709528143c3dSStefano Zampini     for (j=0,psum=0;j<nis;j++) {
709628143c3dSStefano Zampini       PetscInt plen;
709728143c3dSStefano Zampini       ierr = ISGetLocalSize(isarray[j],&plen);CHKERRQ(ierr);
709828143c3dSStefano Zampini       ierr = PetscMPIIntCast(plen,&len);CHKERRQ(ierr);
709928143c3dSStefano Zampini       psum += len+1; /* indices + lenght */
710028143c3dSStefano Zampini     }
7101854ce69bSBarry Smith     ierr = PetscMalloc1(psum,&send_buffer_idxs_is);CHKERRQ(ierr);
710228143c3dSStefano Zampini     for (j=0,psum=0;j<nis;j++) {
710328143c3dSStefano Zampini       PetscInt plen;
710428143c3dSStefano Zampini       const PetscInt *is_array_idxs;
710528143c3dSStefano Zampini       ierr = ISGetLocalSize(isarray[j],&plen);CHKERRQ(ierr);
710628143c3dSStefano Zampini       send_buffer_idxs_is[psum] = plen;
710728143c3dSStefano Zampini       ierr = ISGetIndices(isarray[j],&is_array_idxs);CHKERRQ(ierr);
710828143c3dSStefano Zampini       ierr = PetscMemcpy(&send_buffer_idxs_is[psum+1],is_array_idxs,plen*sizeof(PetscInt));CHKERRQ(ierr);
710928143c3dSStefano Zampini       ierr = ISRestoreIndices(isarray[j],&is_array_idxs);CHKERRQ(ierr);
711028143c3dSStefano Zampini       psum += plen+1; /* indices + lenght */
711128143c3dSStefano Zampini     }
711228143c3dSStefano Zampini     for (i=0;i<n_sends;i++) {
711328143c3dSStefano Zampini       ilengths_idxs_is[is_indices[i]] = psum;
711428143c3dSStefano Zampini     }
711528143c3dSStefano Zampini     ierr = PetscGatherMessageLengths(comm,n_sends,n_recvs,ilengths_idxs_is,&onodes_is,&olengths_idxs_is);CHKERRQ(ierr);
711628143c3dSStefano Zampini   }
71173b3b1effSJed Brown   ierr = MatISRestoreLocalMat(mat,&local_mat);CHKERRQ(ierr);
711828143c3dSStefano Zampini 
7119e7931f94SStefano Zampini   buf_size_idxs = 0;
7120e7931f94SStefano Zampini   buf_size_vals = 0;
712128143c3dSStefano Zampini   buf_size_idxs_is = 0;
71221ae86dd6SStefano Zampini   buf_size_vecs = 0;
7123e7931f94SStefano Zampini   for (i=0;i<n_recvs;i++) {
7124e7931f94SStefano Zampini     buf_size_idxs += (PetscInt)olengths_idxs[i];
7125e7931f94SStefano Zampini     buf_size_vals += (PetscInt)olengths_vals[i];
712628143c3dSStefano Zampini     if (nis) buf_size_idxs_is += (PetscInt)olengths_idxs_is[i];
71271ae86dd6SStefano Zampini     if (nvecs) buf_size_vecs += (PetscInt)olengths_idxs[i];
7128e7931f94SStefano Zampini   }
7129785e854fSJed Brown   ierr = PetscMalloc1(buf_size_idxs,&recv_buffer_idxs);CHKERRQ(ierr);
7130785e854fSJed Brown   ierr = PetscMalloc1(buf_size_vals,&recv_buffer_vals);CHKERRQ(ierr);
713195ecbf38SStefano Zampini   ierr = PetscMalloc1(buf_size_idxs_is,&recv_buffer_idxs_is);CHKERRQ(ierr);
71321ae86dd6SStefano Zampini   ierr = PetscMalloc1(buf_size_vecs,&recv_buffer_vecs);CHKERRQ(ierr);
7133e7931f94SStefano Zampini 
7134e7931f94SStefano Zampini   /* get new tags for clean communications */
7135e7931f94SStefano Zampini   ierr = PetscObjectGetNewTag((PetscObject)mat,&tag_idxs);CHKERRQ(ierr);
7136e7931f94SStefano Zampini   ierr = PetscObjectGetNewTag((PetscObject)mat,&tag_vals);CHKERRQ(ierr);
713728143c3dSStefano Zampini   ierr = PetscObjectGetNewTag((PetscObject)mat,&tag_idxs_is);CHKERRQ(ierr);
71381ae86dd6SStefano Zampini   ierr = PetscObjectGetNewTag((PetscObject)mat,&tag_vecs);CHKERRQ(ierr);
7139e7931f94SStefano Zampini 
7140e7931f94SStefano Zampini   /* allocate for requests */
7141785e854fSJed Brown   ierr = PetscMalloc1(n_sends,&send_req_idxs);CHKERRQ(ierr);
7142785e854fSJed Brown   ierr = PetscMalloc1(n_sends,&send_req_vals);CHKERRQ(ierr);
714395ecbf38SStefano Zampini   ierr = PetscMalloc1(n_sends,&send_req_idxs_is);CHKERRQ(ierr);
71441ae86dd6SStefano Zampini   ierr = PetscMalloc1(n_sends,&send_req_vecs);CHKERRQ(ierr);
7145785e854fSJed Brown   ierr = PetscMalloc1(n_recvs,&recv_req_idxs);CHKERRQ(ierr);
7146785e854fSJed Brown   ierr = PetscMalloc1(n_recvs,&recv_req_vals);CHKERRQ(ierr);
714795ecbf38SStefano Zampini   ierr = PetscMalloc1(n_recvs,&recv_req_idxs_is);CHKERRQ(ierr);
71481ae86dd6SStefano Zampini   ierr = PetscMalloc1(n_recvs,&recv_req_vecs);CHKERRQ(ierr);
7149e7931f94SStefano Zampini 
7150e7931f94SStefano Zampini   /* communications */
7151e7931f94SStefano Zampini   ptr_idxs = recv_buffer_idxs;
7152e7931f94SStefano Zampini   ptr_vals = recv_buffer_vals;
715328143c3dSStefano Zampini   ptr_idxs_is = recv_buffer_idxs_is;
71541ae86dd6SStefano Zampini   ptr_vecs = recv_buffer_vecs;
7155e7931f94SStefano Zampini   for (i=0;i<n_recvs;i++) {
7156e7931f94SStefano Zampini     source_dest = onodes[i];
7157e7931f94SStefano Zampini     ierr = MPI_Irecv(ptr_idxs,olengths_idxs[i],MPIU_INT,source_dest,tag_idxs,comm,&recv_req_idxs[i]);CHKERRQ(ierr);
7158e7931f94SStefano Zampini     ierr = MPI_Irecv(ptr_vals,olengths_vals[i],MPIU_SCALAR,source_dest,tag_vals,comm,&recv_req_vals[i]);CHKERRQ(ierr);
7159e7931f94SStefano Zampini     ptr_idxs += olengths_idxs[i];
7160e7931f94SStefano Zampini     ptr_vals += olengths_vals[i];
716128143c3dSStefano Zampini     if (nis) {
716257de7509SStefano Zampini       source_dest = onodes_is[i];
716328143c3dSStefano Zampini       ierr = MPI_Irecv(ptr_idxs_is,olengths_idxs_is[i],MPIU_INT,source_dest,tag_idxs_is,comm,&recv_req_idxs_is[i]);CHKERRQ(ierr);
716428143c3dSStefano Zampini       ptr_idxs_is += olengths_idxs_is[i];
716528143c3dSStefano Zampini     }
71661ae86dd6SStefano Zampini     if (nvecs) {
71671ae86dd6SStefano Zampini       source_dest = onodes[i];
71681ae86dd6SStefano Zampini       ierr = MPI_Irecv(ptr_vecs,olengths_idxs[i]-2,MPIU_SCALAR,source_dest,tag_vecs,comm,&recv_req_vecs[i]);CHKERRQ(ierr);
71691ae86dd6SStefano Zampini       ptr_vecs += olengths_idxs[i]-2;
71701ae86dd6SStefano Zampini     }
7171e7931f94SStefano Zampini   }
7172e7931f94SStefano Zampini   for (i=0;i<n_sends;i++) {
7173e7931f94SStefano Zampini     ierr = PetscMPIIntCast(is_indices[i],&source_dest);CHKERRQ(ierr);
7174e7931f94SStefano Zampini     ierr = MPI_Isend(send_buffer_idxs,ilengths_idxs[source_dest],MPIU_INT,source_dest,tag_idxs,comm,&send_req_idxs[i]);CHKERRQ(ierr);
7175e7931f94SStefano Zampini     ierr = MPI_Isend(send_buffer_vals,ilengths_vals[source_dest],MPIU_SCALAR,source_dest,tag_vals,comm,&send_req_vals[i]);CHKERRQ(ierr);
717628143c3dSStefano Zampini     if (nis) {
717728143c3dSStefano Zampini       ierr = MPI_Isend(send_buffer_idxs_is,ilengths_idxs_is[source_dest],MPIU_INT,source_dest,tag_idxs_is,comm,&send_req_idxs_is[i]);CHKERRQ(ierr);
717828143c3dSStefano Zampini     }
71791ae86dd6SStefano Zampini     if (nvecs) {
71801ae86dd6SStefano Zampini       ierr = VecGetArray(nnsp_vec[0],&send_buffer_vecs);CHKERRQ(ierr);
71811ae86dd6SStefano Zampini       ierr = MPI_Isend(send_buffer_vecs,ilengths_idxs[source_dest]-2,MPIU_SCALAR,source_dest,tag_vecs,comm,&send_req_vecs[i]);CHKERRQ(ierr);
71821ae86dd6SStefano Zampini     }
7183e7931f94SStefano Zampini   }
7184e7931f94SStefano Zampini   ierr = ISRestoreIndices(is_sends_internal,&is_indices);CHKERRQ(ierr);
7185e7931f94SStefano Zampini   ierr = ISDestroy(&is_sends_internal);CHKERRQ(ierr);
7186e7931f94SStefano Zampini 
7187e7931f94SStefano Zampini   /* assemble new l2g map */
7188e7931f94SStefano Zampini   ierr = MPI_Waitall(n_recvs,recv_req_idxs,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
7189e7931f94SStefano Zampini   ptr_idxs = recv_buffer_idxs;
71909d30be91SStefano Zampini   new_local_rows = 0;
7191e7931f94SStefano Zampini   for (i=0;i<n_recvs;i++) {
71929d30be91SStefano Zampini     new_local_rows += *(ptr_idxs+1); /* second element is the local size of the l2gmap */
7193e7931f94SStefano Zampini     ptr_idxs += olengths_idxs[i];
7194e7931f94SStefano Zampini   }
71959d30be91SStefano Zampini   ierr = PetscMalloc1(new_local_rows,&l2gmap_indices);CHKERRQ(ierr);
7196e7931f94SStefano Zampini   ptr_idxs = recv_buffer_idxs;
71979d30be91SStefano Zampini   new_local_rows = 0;
7198e7931f94SStefano Zampini   for (i=0;i<n_recvs;i++) {
71999d30be91SStefano Zampini     ierr = PetscMemcpy(&l2gmap_indices[new_local_rows],ptr_idxs+2,(*(ptr_idxs+1))*sizeof(PetscInt));CHKERRQ(ierr);
72009d30be91SStefano Zampini     new_local_rows += *(ptr_idxs+1); /* second element is the local size of the l2gmap */
7201e7931f94SStefano Zampini     ptr_idxs += olengths_idxs[i];
7202e7931f94SStefano Zampini   }
72039d30be91SStefano Zampini   ierr = PetscSortRemoveDupsInt(&new_local_rows,l2gmap_indices);CHKERRQ(ierr);
72049d30be91SStefano Zampini   ierr = ISLocalToGlobalMappingCreate(comm_n,1,new_local_rows,l2gmap_indices,PETSC_COPY_VALUES,&l2gmap);CHKERRQ(ierr);
7205e7931f94SStefano Zampini   ierr = PetscFree(l2gmap_indices);CHKERRQ(ierr);
7206e7931f94SStefano Zampini 
7207e7931f94SStefano Zampini   /* infer new local matrix type from received local matrices type */
7208e7931f94SStefano Zampini   /* currently if all local matrices are of type X, then the resulting matrix will be of type X, except for the dense case */
7209e7931f94SStefano Zampini   /* it also assumes that if the block size is set, than it is the same among all local matrices (see checks at the beginning of the function) */
7210e7931f94SStefano Zampini   if (n_recvs) {
721128143c3dSStefano Zampini     MatTypePrivate new_local_type_private = (MatTypePrivate)send_buffer_idxs[0];
7212e7931f94SStefano Zampini     ptr_idxs = recv_buffer_idxs;
7213e7931f94SStefano Zampini     for (i=0;i<n_recvs;i++) {
7214e7931f94SStefano Zampini       if ((PetscInt)new_local_type_private != *ptr_idxs) {
7215e7931f94SStefano Zampini         new_local_type_private = MATAIJ_PRIVATE;
7216e7931f94SStefano Zampini         break;
7217e7931f94SStefano Zampini       }
7218e7931f94SStefano Zampini       ptr_idxs += olengths_idxs[i];
7219e7931f94SStefano Zampini     }
7220e7931f94SStefano Zampini     switch (new_local_type_private) {
722128143c3dSStefano Zampini       case MATDENSE_PRIVATE:
7222e7931f94SStefano Zampini         new_local_type = MATSEQAIJ;
7223e7931f94SStefano Zampini         bs = 1;
7224e7931f94SStefano Zampini         break;
7225e7931f94SStefano Zampini       case MATAIJ_PRIVATE:
7226e7931f94SStefano Zampini         new_local_type = MATSEQAIJ;
7227e7931f94SStefano Zampini         bs = 1;
7228e7931f94SStefano Zampini         break;
7229e7931f94SStefano Zampini       case MATBAIJ_PRIVATE:
7230e7931f94SStefano Zampini         new_local_type = MATSEQBAIJ;
7231e7931f94SStefano Zampini         break;
7232e7931f94SStefano Zampini       case MATSBAIJ_PRIVATE:
7233e7931f94SStefano Zampini         new_local_type = MATSEQSBAIJ;
7234e7931f94SStefano Zampini         break;
7235e7931f94SStefano Zampini       default:
7236fbfcfee5SBarry Smith         SETERRQ2(comm,PETSC_ERR_SUP,"Unsupported private type %d in %s",new_local_type_private,PETSC_FUNCTION_NAME);
7237e7931f94SStefano Zampini         break;
7238e7931f94SStefano Zampini     }
7239ed8ed4edSstefano_zampini   } else { /* by default, new_local_type is seqaij */
7240ed8ed4edSstefano_zampini     new_local_type = MATSEQAIJ;
724128143c3dSStefano Zampini     bs = 1;
7242e7931f94SStefano Zampini   }
7243e7931f94SStefano Zampini 
724470cf5478SStefano Zampini   /* create MATIS object if needed */
724557de7509SStefano Zampini   if (!reuse) {
7246e7931f94SStefano Zampini     ierr = MatGetSize(mat,&rows,&cols);CHKERRQ(ierr);
7247e176bc59SStefano Zampini     ierr = MatCreateIS(comm_n,bs,PETSC_DECIDE,PETSC_DECIDE,rows,cols,l2gmap,NULL,mat_n);CHKERRQ(ierr);
724870cf5478SStefano Zampini   } else {
724970cf5478SStefano Zampini     /* it also destroys the local matrices */
725057de7509SStefano Zampini     if (*mat_n) {
725170cf5478SStefano Zampini       ierr = MatSetLocalToGlobalMapping(*mat_n,l2gmap,l2gmap);CHKERRQ(ierr);
725257de7509SStefano Zampini     } else { /* this is a fake object */
725357de7509SStefano Zampini       ierr = MatCreateIS(comm_n,bs,PETSC_DECIDE,PETSC_DECIDE,rows,cols,l2gmap,NULL,mat_n);CHKERRQ(ierr);
725457de7509SStefano Zampini     }
725570cf5478SStefano Zampini   }
725670cf5478SStefano Zampini   ierr = MatISGetLocalMat(*mat_n,&local_mat);CHKERRQ(ierr);
7257e7931f94SStefano Zampini   ierr = MatSetType(local_mat,new_local_type);CHKERRQ(ierr);
72589d30be91SStefano Zampini 
72599d30be91SStefano Zampini   ierr = MPI_Waitall(n_recvs,recv_req_vals,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
72609d30be91SStefano Zampini 
72619d30be91SStefano Zampini   /* Global to local map of received indices */
72629d30be91SStefano Zampini   ierr = PetscMalloc1(buf_size_idxs,&recv_buffer_idxs_local);CHKERRQ(ierr); /* needed for values insertion */
72639d30be91SStefano Zampini   ierr = ISGlobalToLocalMappingApply(l2gmap,IS_GTOLM_MASK,buf_size_idxs,recv_buffer_idxs,&i,recv_buffer_idxs_local);CHKERRQ(ierr);
72649d30be91SStefano Zampini   ierr = ISLocalToGlobalMappingDestroy(&l2gmap);CHKERRQ(ierr);
72659d30be91SStefano Zampini 
72669d30be91SStefano Zampini   /* restore attributes -> type of incoming data and its size */
72679d30be91SStefano Zampini   buf_size_idxs = 0;
72689d30be91SStefano Zampini   for (i=0;i<n_recvs;i++) {
72699d30be91SStefano Zampini     recv_buffer_idxs_local[buf_size_idxs] = recv_buffer_idxs[buf_size_idxs];
72709d30be91SStefano Zampini     recv_buffer_idxs_local[buf_size_idxs+1] = recv_buffer_idxs[buf_size_idxs+1];
72719d30be91SStefano Zampini     buf_size_idxs += (PetscInt)olengths_idxs[i];
72729d30be91SStefano Zampini   }
72739d30be91SStefano Zampini   ierr = PetscFree(recv_buffer_idxs);CHKERRQ(ierr);
72749d30be91SStefano Zampini 
72759d30be91SStefano Zampini   /* set preallocation */
72769d30be91SStefano Zampini   ierr = PetscObjectTypeCompare((PetscObject)local_mat,MATSEQDENSE,&newisdense);CHKERRQ(ierr);
72779d30be91SStefano Zampini   if (!newisdense) {
72789d30be91SStefano Zampini     PetscInt *new_local_nnz=0;
72799d30be91SStefano Zampini 
72809d30be91SStefano Zampini     ptr_idxs = recv_buffer_idxs_local;
72819d30be91SStefano Zampini     if (n_recvs) {
72829d30be91SStefano Zampini       ierr = PetscCalloc1(new_local_rows,&new_local_nnz);CHKERRQ(ierr);
72839d30be91SStefano Zampini     }
72849d30be91SStefano Zampini     for (i=0;i<n_recvs;i++) {
72859d30be91SStefano Zampini       PetscInt j;
72869d30be91SStefano Zampini       if (*ptr_idxs == (PetscInt)MATDENSE_PRIVATE) { /* preallocation provided for dense case only */
72879d30be91SStefano Zampini         for (j=0;j<*(ptr_idxs+1);j++) {
72889d30be91SStefano Zampini           new_local_nnz[*(ptr_idxs+2+j)] += *(ptr_idxs+1);
72899d30be91SStefano Zampini         }
72909d30be91SStefano Zampini       } else {
72919d30be91SStefano Zampini         /* TODO */
72929d30be91SStefano Zampini       }
72939d30be91SStefano Zampini       ptr_idxs += olengths_idxs[i];
72949d30be91SStefano Zampini     }
72959d30be91SStefano Zampini     if (new_local_nnz) {
72969d30be91SStefano Zampini       for (i=0;i<new_local_rows;i++) new_local_nnz[i] = PetscMin(new_local_nnz[i],new_local_rows);
72979d30be91SStefano Zampini       ierr = MatSeqAIJSetPreallocation(local_mat,0,new_local_nnz);CHKERRQ(ierr);
72989d30be91SStefano Zampini       for (i=0;i<new_local_rows;i++) new_local_nnz[i] /= bs;
72999d30be91SStefano Zampini       ierr = MatSeqBAIJSetPreallocation(local_mat,bs,0,new_local_nnz);CHKERRQ(ierr);
73009d30be91SStefano Zampini       for (i=0;i<new_local_rows;i++) new_local_nnz[i] = PetscMax(new_local_nnz[i]-i,0);
73019d30be91SStefano Zampini       ierr = MatSeqSBAIJSetPreallocation(local_mat,bs,0,new_local_nnz);CHKERRQ(ierr);
73029d30be91SStefano Zampini     } else {
73039d30be91SStefano Zampini       ierr = MatSetUp(local_mat);CHKERRQ(ierr);
73049d30be91SStefano Zampini     }
73059d30be91SStefano Zampini     ierr = PetscFree(new_local_nnz);CHKERRQ(ierr);
73069d30be91SStefano Zampini   } else {
73079d30be91SStefano Zampini     ierr = MatSetUp(local_mat);CHKERRQ(ierr);
73089d30be91SStefano Zampini   }
7309e7931f94SStefano Zampini 
7310e7931f94SStefano Zampini   /* set values */
7311e7931f94SStefano Zampini   ptr_vals = recv_buffer_vals;
73129d30be91SStefano Zampini   ptr_idxs = recv_buffer_idxs_local;
7313e7931f94SStefano Zampini   for (i=0;i<n_recvs;i++) {
7314e7931f94SStefano Zampini     if (*ptr_idxs == (PetscInt)MATDENSE_PRIVATE) { /* values insertion provided for dense case only */
7315e7931f94SStefano Zampini       ierr = MatSetOption(local_mat,MAT_ROW_ORIENTED,PETSC_FALSE);CHKERRQ(ierr);
73169d30be91SStefano Zampini       ierr = MatSetValues(local_mat,*(ptr_idxs+1),ptr_idxs+2,*(ptr_idxs+1),ptr_idxs+2,ptr_vals,ADD_VALUES);CHKERRQ(ierr);
7317e7931f94SStefano Zampini       ierr = MatAssemblyBegin(local_mat,MAT_FLUSH_ASSEMBLY);CHKERRQ(ierr);
7318e7931f94SStefano Zampini       ierr = MatAssemblyEnd(local_mat,MAT_FLUSH_ASSEMBLY);CHKERRQ(ierr);
7319e7931f94SStefano Zampini       ierr = MatSetOption(local_mat,MAT_ROW_ORIENTED,PETSC_TRUE);CHKERRQ(ierr);
732028143c3dSStefano Zampini     } else {
732128143c3dSStefano Zampini       /* TODO */
7322e7931f94SStefano Zampini     }
7323e7931f94SStefano Zampini     ptr_idxs += olengths_idxs[i];
7324e7931f94SStefano Zampini     ptr_vals += olengths_vals[i];
7325e7931f94SStefano Zampini   }
7326e7931f94SStefano Zampini   ierr = MatAssemblyBegin(local_mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
7327e7931f94SStefano Zampini   ierr = MatAssemblyEnd(local_mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
73283b3b1effSJed Brown   ierr = MatISRestoreLocalMat(*mat_n,&local_mat);CHKERRQ(ierr);
732970cf5478SStefano Zampini   ierr = MatAssemblyBegin(*mat_n,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
733070cf5478SStefano Zampini   ierr = MatAssemblyEnd(*mat_n,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
73319d30be91SStefano Zampini   ierr = PetscFree(recv_buffer_vals);CHKERRQ(ierr);
7332e7931f94SStefano Zampini 
7333dfd14d43SStefano Zampini #if 0
733428143c3dSStefano Zampini   if (!restrict_comm) { /* check */
7335e7931f94SStefano Zampini     Vec       lvec,rvec;
7336e7931f94SStefano Zampini     PetscReal infty_error;
7337e7931f94SStefano Zampini 
73382a7a6963SBarry Smith     ierr = MatCreateVecs(mat,&rvec,&lvec);CHKERRQ(ierr);
7339e7931f94SStefano Zampini     ierr = VecSetRandom(rvec,NULL);CHKERRQ(ierr);
7340e7931f94SStefano Zampini     ierr = MatMult(mat,rvec,lvec);CHKERRQ(ierr);
7341e7931f94SStefano Zampini     ierr = VecScale(lvec,-1.0);CHKERRQ(ierr);
734270cf5478SStefano Zampini     ierr = MatMultAdd(*mat_n,rvec,lvec,lvec);CHKERRQ(ierr);
7343e7931f94SStefano Zampini     ierr = VecNorm(lvec,NORM_INFINITY,&infty_error);CHKERRQ(ierr);
7344e7931f94SStefano Zampini     ierr = PetscPrintf(PetscObjectComm((PetscObject)mat),"Infinity error subassembling %1.6e\n",infty_error);
7345e7931f94SStefano Zampini     ierr = VecDestroy(&rvec);CHKERRQ(ierr);
7346e7931f94SStefano Zampini     ierr = VecDestroy(&lvec);CHKERRQ(ierr);
7347e7931f94SStefano Zampini   }
734828143c3dSStefano Zampini #endif
7349e7931f94SStefano Zampini 
735028143c3dSStefano Zampini   /* assemble new additional is (if any) */
735128143c3dSStefano Zampini   if (nis) {
735228143c3dSStefano Zampini     PetscInt **temp_idxs,*count_is,j,psum;
735328143c3dSStefano Zampini 
735428143c3dSStefano Zampini     ierr = MPI_Waitall(n_recvs,recv_req_idxs_is,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
7355854ce69bSBarry Smith     ierr = PetscCalloc1(nis,&count_is);CHKERRQ(ierr);
735628143c3dSStefano Zampini     ptr_idxs = recv_buffer_idxs_is;
735728143c3dSStefano Zampini     psum = 0;
735828143c3dSStefano Zampini     for (i=0;i<n_recvs;i++) {
735928143c3dSStefano Zampini       for (j=0;j<nis;j++) {
736028143c3dSStefano Zampini         PetscInt plen = *(ptr_idxs); /* first element is the local size of IS's indices */
736128143c3dSStefano Zampini         count_is[j] += plen; /* increment counting of buffer for j-th IS */
736228143c3dSStefano Zampini         psum += plen;
736328143c3dSStefano Zampini         ptr_idxs += plen+1; /* shift pointer to received data */
736428143c3dSStefano Zampini       }
736528143c3dSStefano Zampini     }
7366854ce69bSBarry Smith     ierr = PetscMalloc1(nis,&temp_idxs);CHKERRQ(ierr);
7367854ce69bSBarry Smith     ierr = PetscMalloc1(psum,&temp_idxs[0]);CHKERRQ(ierr);
736828143c3dSStefano Zampini     for (i=1;i<nis;i++) {
736928143c3dSStefano Zampini       temp_idxs[i] = temp_idxs[i-1]+count_is[i-1];
737028143c3dSStefano Zampini     }
737128143c3dSStefano Zampini     ierr = PetscMemzero(count_is,nis*sizeof(PetscInt));CHKERRQ(ierr);
737228143c3dSStefano Zampini     ptr_idxs = recv_buffer_idxs_is;
737328143c3dSStefano Zampini     for (i=0;i<n_recvs;i++) {
737428143c3dSStefano Zampini       for (j=0;j<nis;j++) {
737528143c3dSStefano Zampini         PetscInt plen = *(ptr_idxs); /* first element is the local size of IS's indices */
737628143c3dSStefano Zampini         ierr = PetscMemcpy(&temp_idxs[j][count_is[j]],ptr_idxs+1,plen*sizeof(PetscInt));CHKERRQ(ierr);
737728143c3dSStefano Zampini         count_is[j] += plen; /* increment starting point of buffer for j-th IS */
737828143c3dSStefano Zampini         ptr_idxs += plen+1; /* shift pointer to received data */
737928143c3dSStefano Zampini       }
738028143c3dSStefano Zampini     }
738128143c3dSStefano Zampini     for (i=0;i<nis;i++) {
738228143c3dSStefano Zampini       ierr = ISDestroy(&isarray[i]);CHKERRQ(ierr);
738328143c3dSStefano Zampini       ierr = PetscSortRemoveDupsInt(&count_is[i],temp_idxs[i]);CHKERRQ(ierr);CHKERRQ(ierr);
738428143c3dSStefano Zampini       ierr = ISCreateGeneral(comm_n,count_is[i],temp_idxs[i],PETSC_COPY_VALUES,&isarray[i]);CHKERRQ(ierr);
738528143c3dSStefano Zampini     }
738628143c3dSStefano Zampini     ierr = PetscFree(count_is);CHKERRQ(ierr);
738728143c3dSStefano Zampini     ierr = PetscFree(temp_idxs[0]);CHKERRQ(ierr);
738828143c3dSStefano Zampini     ierr = PetscFree(temp_idxs);CHKERRQ(ierr);
738928143c3dSStefano Zampini   }
7390e7931f94SStefano Zampini   /* free workspace */
739128143c3dSStefano Zampini   ierr = PetscFree(recv_buffer_idxs_is);CHKERRQ(ierr);
7392e7931f94SStefano Zampini   ierr = MPI_Waitall(n_sends,send_req_idxs,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
7393e7931f94SStefano Zampini   ierr = PetscFree(send_buffer_idxs);CHKERRQ(ierr);
7394e7931f94SStefano Zampini   ierr = MPI_Waitall(n_sends,send_req_vals,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
7395e7931f94SStefano Zampini   if (isdense) {
7396e7931f94SStefano Zampini     ierr = MatISGetLocalMat(mat,&local_mat);CHKERRQ(ierr);
7397e7931f94SStefano Zampini     ierr = MatDenseRestoreArray(local_mat,&send_buffer_vals);CHKERRQ(ierr);
73983b3b1effSJed Brown     ierr = MatISRestoreLocalMat(mat,&local_mat);CHKERRQ(ierr);
7399e7931f94SStefano Zampini   } else {
7400e7931f94SStefano Zampini     /* ierr = PetscFree(send_buffer_vals);CHKERRQ(ierr); */
7401e7931f94SStefano Zampini   }
740228143c3dSStefano Zampini   if (nis) {
740328143c3dSStefano Zampini     ierr = MPI_Waitall(n_sends,send_req_idxs_is,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
740428143c3dSStefano Zampini     ierr = PetscFree(send_buffer_idxs_is);CHKERRQ(ierr);
740528143c3dSStefano Zampini   }
74061ae86dd6SStefano Zampini 
74071ae86dd6SStefano Zampini   if (nvecs) {
74081ae86dd6SStefano Zampini     ierr = MPI_Waitall(n_recvs,recv_req_vecs,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
74091ae86dd6SStefano Zampini     ierr = MPI_Waitall(n_sends,send_req_vecs,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
74101ae86dd6SStefano Zampini     ierr = VecRestoreArray(nnsp_vec[0],&send_buffer_vecs);CHKERRQ(ierr);
74111ae86dd6SStefano Zampini     ierr = VecDestroy(&nnsp_vec[0]);CHKERRQ(ierr);
74121ae86dd6SStefano Zampini     ierr = VecCreate(comm_n,&nnsp_vec[0]);CHKERRQ(ierr);
74131ae86dd6SStefano Zampini     ierr = VecSetSizes(nnsp_vec[0],new_local_rows,PETSC_DECIDE);CHKERRQ(ierr);
74141ae86dd6SStefano Zampini     ierr = VecSetType(nnsp_vec[0],VECSTANDARD);CHKERRQ(ierr);
74151ae86dd6SStefano Zampini     /* set values */
74161ae86dd6SStefano Zampini     ptr_vals = recv_buffer_vecs;
74171ae86dd6SStefano Zampini     ptr_idxs = recv_buffer_idxs_local;
74181ae86dd6SStefano Zampini     ierr = VecGetArray(nnsp_vec[0],&send_buffer_vecs);CHKERRQ(ierr);
74191ae86dd6SStefano Zampini     for (i=0;i<n_recvs;i++) {
74201ae86dd6SStefano Zampini       PetscInt j;
74211ae86dd6SStefano Zampini       for (j=0;j<*(ptr_idxs+1);j++) {
74221ae86dd6SStefano Zampini         send_buffer_vecs[*(ptr_idxs+2+j)] += *(ptr_vals + j);
74231ae86dd6SStefano Zampini       }
74241ae86dd6SStefano Zampini       ptr_idxs += olengths_idxs[i];
74251ae86dd6SStefano Zampini       ptr_vals += olengths_idxs[i]-2;
74261ae86dd6SStefano Zampini     }
74271ae86dd6SStefano Zampini     ierr = VecRestoreArray(nnsp_vec[0],&send_buffer_vecs);CHKERRQ(ierr);
74281ae86dd6SStefano Zampini     ierr = VecAssemblyBegin(nnsp_vec[0]);CHKERRQ(ierr);
74291ae86dd6SStefano Zampini     ierr = VecAssemblyEnd(nnsp_vec[0]);CHKERRQ(ierr);
74301ae86dd6SStefano Zampini   }
74311ae86dd6SStefano Zampini 
74321ae86dd6SStefano Zampini   ierr = PetscFree(recv_buffer_vecs);CHKERRQ(ierr);
74331ae86dd6SStefano Zampini   ierr = PetscFree(recv_buffer_idxs_local);CHKERRQ(ierr);
7434e7931f94SStefano Zampini   ierr = PetscFree(recv_req_idxs);CHKERRQ(ierr);
7435e7931f94SStefano Zampini   ierr = PetscFree(recv_req_vals);CHKERRQ(ierr);
74361ae86dd6SStefano Zampini   ierr = PetscFree(recv_req_vecs);CHKERRQ(ierr);
743728143c3dSStefano Zampini   ierr = PetscFree(recv_req_idxs_is);CHKERRQ(ierr);
7438e7931f94SStefano Zampini   ierr = PetscFree(send_req_idxs);CHKERRQ(ierr);
7439e7931f94SStefano Zampini   ierr = PetscFree(send_req_vals);CHKERRQ(ierr);
74401ae86dd6SStefano Zampini   ierr = PetscFree(send_req_vecs);CHKERRQ(ierr);
744128143c3dSStefano Zampini   ierr = PetscFree(send_req_idxs_is);CHKERRQ(ierr);
7442e7931f94SStefano Zampini   ierr = PetscFree(ilengths_vals);CHKERRQ(ierr);
7443e7931f94SStefano Zampini   ierr = PetscFree(ilengths_idxs);CHKERRQ(ierr);
7444e7931f94SStefano Zampini   ierr = PetscFree(olengths_vals);CHKERRQ(ierr);
7445e7931f94SStefano Zampini   ierr = PetscFree(olengths_idxs);CHKERRQ(ierr);
7446e7931f94SStefano Zampini   ierr = PetscFree(onodes);CHKERRQ(ierr);
744728143c3dSStefano Zampini   if (nis) {
744828143c3dSStefano Zampini     ierr = PetscFree(ilengths_idxs_is);CHKERRQ(ierr);
744928143c3dSStefano Zampini     ierr = PetscFree(olengths_idxs_is);CHKERRQ(ierr);
745028143c3dSStefano Zampini     ierr = PetscFree(onodes_is);CHKERRQ(ierr);
745128143c3dSStefano Zampini   }
745228143c3dSStefano Zampini   ierr = PetscSubcommDestroy(&subcomm);CHKERRQ(ierr);
745328143c3dSStefano Zampini   if (destroy_mat) { /* destroy mat is true only if restrict comm is true and process will not partecipate */
745428143c3dSStefano Zampini     ierr = MatDestroy(mat_n);CHKERRQ(ierr);
745528143c3dSStefano Zampini     for (i=0;i<nis;i++) {
745628143c3dSStefano Zampini       ierr = ISDestroy(&isarray[i]);CHKERRQ(ierr);
745728143c3dSStefano Zampini     }
74581ae86dd6SStefano Zampini     if (nvecs) { /* need to match VecDestroy nnsp_vec called in the other code path */
74591ae86dd6SStefano Zampini       ierr = VecDestroy(&nnsp_vec[0]);CHKERRQ(ierr);
74601ae86dd6SStefano Zampini     }
746153a05cb3SStefano Zampini     *mat_n = NULL;
746228143c3dSStefano Zampini   }
7463e7931f94SStefano Zampini   PetscFunctionReturn(0);
7464e7931f94SStefano Zampini }
7465a57a6d2fSStefano Zampini 
746612edc857SStefano Zampini /* temporary hack into ksp private data structure */
7467af0996ceSBarry Smith #include <petsc/private/kspimpl.h>
746812edc857SStefano Zampini 
7469c8587f34SStefano Zampini PetscErrorCode PCBDDCSetUpCoarseSolver(PC pc,PetscScalar* coarse_submat_vals)
7470c8587f34SStefano Zampini {
7471c8587f34SStefano Zampini   PC_BDDC                *pcbddc = (PC_BDDC*)pc->data;
7472c8587f34SStefano Zampini   PC_IS                  *pcis = (PC_IS*)pc->data;
747320a2ab83SStefano Zampini   Mat                    coarse_mat,coarse_mat_is,coarse_submat_dense;
74741ae86dd6SStefano Zampini   Mat                    coarsedivudotp = NULL;
74751e0482f5SStefano Zampini   Mat                    coarseG,t_coarse_mat_is;
74769881197aSStefano Zampini   MatNullSpace           CoarseNullSpace = NULL;
747720a2ab83SStefano Zampini   ISLocalToGlobalMapping coarse_islg;
74786e683305SStefano Zampini   IS                     coarse_is,*isarray;
74796e683305SStefano Zampini   PetscInt               i,im_active=-1,active_procs=-1;
748030368db7SStefano Zampini   PetscInt               nis,nisdofs,nisneu,nisvert;
7481f9eb5b7dSStefano Zampini   PC                     pc_temp;
7482c8587f34SStefano Zampini   PCType                 coarse_pc_type;
7483c8587f34SStefano Zampini   KSPType                coarse_ksp_type;
7484f9eb5b7dSStefano Zampini   PetscBool              multilevel_requested,multilevel_allowed;
74857274672aSStefano Zampini   PetscBool              coarse_reuse;
74861e0482f5SStefano Zampini   PetscInt               ncoarse,nedcfield;
748768457ee5SStefano Zampini   PetscBool              compute_vecs = PETSC_FALSE;
748822bc73bbSStefano Zampini   PetscScalar            *array;
748957de7509SStefano Zampini   MatReuse               coarse_mat_reuse;
749057de7509SStefano Zampini   PetscBool              restr, full_restr, have_void;
74917de4f681Sstefano_zampini   PetscMPIInt            commsize;
74929881197aSStefano Zampini   PetscErrorCode         ierr;
7493fdc09c96SStefano Zampini 
7494c8587f34SStefano Zampini   PetscFunctionBegin;
7495c8587f34SStefano Zampini   /* Assign global numbering to coarse dofs */
749668457ee5SStefano Zampini   if (pcbddc->new_primal_space || pcbddc->coarse_size == -1) { /* a new primal space is present or it is the first initialization, so recompute global numbering */
7497fa7f1dd8SStefano Zampini     PetscInt ocoarse_size;
74985a75c04eSSatish Balay     compute_vecs = PETSC_TRUE;
74997de4f681Sstefano_zampini 
75007de4f681Sstefano_zampini     pcbddc->new_primal_space = PETSC_TRUE;
7501fa7f1dd8SStefano Zampini     ocoarse_size = pcbddc->coarse_size;
7502f4ddd8eeSStefano Zampini     ierr = PetscFree(pcbddc->global_primal_indices);CHKERRQ(ierr);
7503f4ddd8eeSStefano Zampini     ierr = PCBDDCComputePrimalNumbering(pc,&pcbddc->coarse_size,&pcbddc->global_primal_indices);CHKERRQ(ierr);
7504f4ddd8eeSStefano Zampini     /* see if we can avoid some work */
7505fa7f1dd8SStefano Zampini     if (pcbddc->coarse_ksp) { /* coarse ksp has already been created */
750651bea450SStefano Zampini       /* if the coarse size is different or we are using adaptive selection, better to not reuse the coarse matrix */
750751bea450SStefano Zampini       if (ocoarse_size != pcbddc->coarse_size || pcbddc->adaptive_selection) {
7508727cdba6SStefano Zampini         ierr = KSPReset(pcbddc->coarse_ksp);CHKERRQ(ierr);
7509fa7f1dd8SStefano Zampini         coarse_reuse = PETSC_FALSE;
7510fa7f1dd8SStefano Zampini       } else { /* we can safely reuse already computed coarse matrix */
7511fa7f1dd8SStefano Zampini         coarse_reuse = PETSC_TRUE;
7512f4ddd8eeSStefano Zampini       }
7513fa7f1dd8SStefano Zampini     } else { /* there's no coarse ksp, so we need to create the coarse matrix too */
7514fa7f1dd8SStefano Zampini       coarse_reuse = PETSC_FALSE;
7515f4ddd8eeSStefano Zampini     }
751670cf5478SStefano Zampini     /* reset any subassembling information */
751757de7509SStefano Zampini     if (!coarse_reuse || pcbddc->recompute_topography) {
751870cf5478SStefano Zampini       ierr = ISDestroy(&pcbddc->coarse_subassembling);CHKERRQ(ierr);
751957de7509SStefano Zampini     }
75206e683305SStefano Zampini   } else { /* primal space is unchanged, so we can reuse coarse matrix */
7521fa7f1dd8SStefano Zampini     coarse_reuse = PETSC_TRUE;
7522f4ddd8eeSStefano Zampini   }
752357de7509SStefano Zampini   /* assemble coarse matrix */
752457de7509SStefano Zampini   if (coarse_reuse && pcbddc->coarse_ksp) {
752557de7509SStefano Zampini     ierr = KSPGetOperators(pcbddc->coarse_ksp,&coarse_mat,NULL);CHKERRQ(ierr);
752657de7509SStefano Zampini     ierr = PetscObjectReference((PetscObject)coarse_mat);CHKERRQ(ierr);
752757de7509SStefano Zampini     coarse_mat_reuse = MAT_REUSE_MATRIX;
752818a45a71SStefano Zampini   } else {
752957de7509SStefano Zampini     coarse_mat = NULL;
753057de7509SStefano Zampini     coarse_mat_reuse = MAT_INITIAL_MATRIX;
75316e683305SStefano Zampini   }
7532e7931f94SStefano Zampini 
7533abbbba34SStefano Zampini   /* creates temporary l2gmap and IS for coarse indexes */
7534abbbba34SStefano Zampini   ierr = ISCreateGeneral(PetscObjectComm((PetscObject)pc),pcbddc->local_primal_size,pcbddc->global_primal_indices,PETSC_COPY_VALUES,&coarse_is);CHKERRQ(ierr);
7535abbbba34SStefano Zampini   ierr = ISLocalToGlobalMappingCreateIS(coarse_is,&coarse_islg);CHKERRQ(ierr);
7536abbbba34SStefano Zampini 
7537abbbba34SStefano Zampini   /* creates temporary MATIS object for coarse matrix */
753822bc73bbSStefano Zampini   ierr = MatCreateSeqDense(PETSC_COMM_SELF,pcbddc->local_primal_size,pcbddc->local_primal_size,NULL,&coarse_submat_dense);CHKERRQ(ierr);
753922bc73bbSStefano Zampini   ierr = MatDenseGetArray(coarse_submat_dense,&array);CHKERRQ(ierr);
754022bc73bbSStefano Zampini   ierr = PetscMemcpy(array,coarse_submat_vals,sizeof(*coarse_submat_vals)*pcbddc->local_primal_size*pcbddc->local_primal_size);CHKERRQ(ierr);
754122bc73bbSStefano Zampini   ierr = MatDenseRestoreArray(coarse_submat_dense,&array);CHKERRQ(ierr);
7542e176bc59SStefano Zampini   ierr = MatCreateIS(PetscObjectComm((PetscObject)pc),1,PETSC_DECIDE,PETSC_DECIDE,pcbddc->coarse_size,pcbddc->coarse_size,coarse_islg,NULL,&t_coarse_mat_is);CHKERRQ(ierr);
75436e683305SStefano Zampini   ierr = MatISSetLocalMat(t_coarse_mat_is,coarse_submat_dense);CHKERRQ(ierr);
75446e683305SStefano Zampini   ierr = MatAssemblyBegin(t_coarse_mat_is,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
75456e683305SStefano Zampini   ierr = MatAssemblyEnd(t_coarse_mat_is,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
7546abbbba34SStefano Zampini   ierr = MatDestroy(&coarse_submat_dense);CHKERRQ(ierr);
7547abbbba34SStefano Zampini 
754857de7509SStefano Zampini   /* count "active" (i.e. with positive local size) and "void" processes */
754957de7509SStefano Zampini   im_active = !!(pcis->n);
755057de7509SStefano Zampini   ierr = MPIU_Allreduce(&im_active,&active_procs,1,MPIU_INT,MPI_SUM,PetscObjectComm((PetscObject)pc));CHKERRQ(ierr);
755157de7509SStefano Zampini 
755214f0bfb9SStefano Zampini   /* determine the number of processes participating in the coarse solver and compute the subassembling pattern */
755357de7509SStefano Zampini   /* restr : whether we want to exclude senders (which are not receivers) from the subassembling pattern */
755457de7509SStefano Zampini   /* full_restr : just use the receivers from the subassembling pattern */
75557de4f681Sstefano_zampini   ierr = MPI_Comm_size(PetscObjectComm((PetscObject)pc),&commsize);CHKERRQ(ierr);
755657de7509SStefano Zampini   coarse_mat_is = NULL;
755757de7509SStefano Zampini   multilevel_allowed = PETSC_FALSE;
755857de7509SStefano Zampini   multilevel_requested = PETSC_FALSE;
75591ae86dd6SStefano Zampini   pcbddc->coarse_eqs_per_proc = PetscMin(PetscMax(pcbddc->coarse_size,1),pcbddc->coarse_eqs_per_proc);
756057de7509SStefano Zampini   if (pcbddc->current_level < pcbddc->max_levels) multilevel_requested = PETSC_TRUE;
756157de7509SStefano Zampini   if (multilevel_requested) {
756257de7509SStefano Zampini     ncoarse = active_procs/pcbddc->coarsening_ratio;
756357de7509SStefano Zampini     restr = PETSC_FALSE;
756457de7509SStefano Zampini     full_restr = PETSC_FALSE;
756557de7509SStefano Zampini   } else {
756657de7509SStefano Zampini     ncoarse = pcbddc->coarse_size/pcbddc->coarse_eqs_per_proc;
756757de7509SStefano Zampini     restr = PETSC_TRUE;
756857de7509SStefano Zampini     full_restr = PETSC_TRUE;
756957de7509SStefano Zampini   }
75707de4f681Sstefano_zampini   if (!pcbddc->coarse_size || commsize == 1) multilevel_allowed = multilevel_requested = restr = full_restr = PETSC_FALSE;
757157de7509SStefano Zampini   ncoarse = PetscMax(1,ncoarse);
757257de7509SStefano Zampini   if (!pcbddc->coarse_subassembling) {
7573a198735bSStefano Zampini     if (pcbddc->coarsening_ratio > 1) {
7574bb360cb4SStefano Zampini       if (multilevel_requested) {
7575bb360cb4SStefano Zampini         ierr = PCBDDCMatISGetSubassemblingPattern(pc->pmat,&ncoarse,pcbddc->coarse_adj_red,&pcbddc->coarse_subassembling,&have_void);CHKERRQ(ierr);
7576bb360cb4SStefano Zampini       } else {
7577bb360cb4SStefano Zampini         ierr = PCBDDCMatISGetSubassemblingPattern(t_coarse_mat_is,&ncoarse,pcbddc->coarse_adj_red,&pcbddc->coarse_subassembling,&have_void);CHKERRQ(ierr);
7578bb360cb4SStefano Zampini       }
7579a198735bSStefano Zampini     } else {
75807de4f681Sstefano_zampini       PetscMPIInt rank;
7581a198735bSStefano Zampini       ierr = MPI_Comm_rank(PetscObjectComm((PetscObject)pc),&rank);CHKERRQ(ierr);
75827de4f681Sstefano_zampini       have_void = (active_procs == (PetscInt)commsize) ? PETSC_FALSE : PETSC_TRUE;
7583a198735bSStefano Zampini       ierr = ISCreateStride(PetscObjectComm((PetscObject)pc),1,rank,1,&pcbddc->coarse_subassembling);CHKERRQ(ierr);
7584a198735bSStefano Zampini     }
758557de7509SStefano Zampini   } else { /* if a subassembling pattern exists, then we can reuse the coarse ksp and compute the number of process involved */
758657de7509SStefano Zampini     PetscInt    psum;
758757de7509SStefano Zampini     if (pcbddc->coarse_ksp) psum = 1;
758857de7509SStefano Zampini     else psum = 0;
758957de7509SStefano Zampini     ierr = MPIU_Allreduce(&psum,&ncoarse,1,MPIU_INT,MPI_SUM,PetscObjectComm((PetscObject)pc));CHKERRQ(ierr);
75907de4f681Sstefano_zampini     if (ncoarse < commsize) have_void = PETSC_TRUE;
759157de7509SStefano Zampini   }
759257de7509SStefano Zampini   /* determine if we can go multilevel */
759357de7509SStefano Zampini   if (multilevel_requested) {
759457de7509SStefano Zampini     if (ncoarse > 1) multilevel_allowed = PETSC_TRUE; /* found enough processes */
759557de7509SStefano Zampini     else restr = full_restr = PETSC_TRUE; /* 1 subdomain, use a direct solver */
759657de7509SStefano Zampini   }
759757de7509SStefano Zampini   if (multilevel_allowed && have_void) restr = PETSC_TRUE;
759857de7509SStefano Zampini 
7599e4d548c7SStefano Zampini   /* dump subassembling pattern */
7600e4d548c7SStefano Zampini   if (pcbddc->dbg_flag && multilevel_allowed) {
7601e4d548c7SStefano Zampini     ierr = ISView(pcbddc->coarse_subassembling,pcbddc->dbg_viewer);CHKERRQ(ierr);
7602e4d548c7SStefano Zampini   }
7603e4d548c7SStefano Zampini 
76046e683305SStefano Zampini   /* compute dofs splitting and neumann boundaries for coarse dofs */
76051e0482f5SStefano Zampini   nedcfield = -1;
76061e0482f5SStefano Zampini   if (multilevel_allowed && !coarse_reuse && (pcbddc->n_ISForDofsLocal || pcbddc->NeumannBoundariesLocal || pcbddc->nedclocal)) { /* protects from unneded computations */
76076e683305SStefano Zampini     PetscInt               *tidxs,*tidxs2,nout,tsize,i;
76086e683305SStefano Zampini     const PetscInt         *idxs;
76096e683305SStefano Zampini     ISLocalToGlobalMapping tmap;
76106e683305SStefano Zampini 
76116e683305SStefano Zampini     /* create map between primal indices (in local representative ordering) and local primal numbering */
76120be93d54SStefano Zampini     ierr = ISLocalToGlobalMappingCreate(PETSC_COMM_SELF,1,pcbddc->local_primal_size,pcbddc->primal_indices_local_idxs,PETSC_COPY_VALUES,&tmap);CHKERRQ(ierr);
76136e683305SStefano Zampini     /* allocate space for temporary storage */
7614854ce69bSBarry Smith     ierr = PetscMalloc1(pcbddc->local_primal_size,&tidxs);CHKERRQ(ierr);
7615854ce69bSBarry Smith     ierr = PetscMalloc1(pcbddc->local_primal_size,&tidxs2);CHKERRQ(ierr);
76166e683305SStefano Zampini     /* allocate for IS array */
76176e683305SStefano Zampini     nisdofs = pcbddc->n_ISForDofsLocal;
76181e0482f5SStefano Zampini     if (pcbddc->nedclocal) {
76191e0482f5SStefano Zampini       if (pcbddc->nedfield > -1) {
76201e0482f5SStefano Zampini         nedcfield = pcbddc->nedfield;
76211e0482f5SStefano Zampini       } else {
76221e0482f5SStefano Zampini         nedcfield = 0;
76231e0482f5SStefano Zampini         if (nisdofs) SETERRQ1(PetscObjectComm((PetscObject)pc),PETSC_ERR_PLIB,"This should not happen (%d)",nisdofs);
76241e0482f5SStefano Zampini         nisdofs = 1;
76251e0482f5SStefano Zampini       }
76261e0482f5SStefano Zampini     }
76276e683305SStefano Zampini     nisneu = !!pcbddc->NeumannBoundariesLocal;
762827b6a85dSStefano Zampini     nisvert = 0; /* nisvert is not used */
762930368db7SStefano Zampini     nis = nisdofs + nisneu + nisvert;
7630854ce69bSBarry Smith     ierr = PetscMalloc1(nis,&isarray);CHKERRQ(ierr);
76316e683305SStefano Zampini     /* dofs splitting */
76326e683305SStefano Zampini     for (i=0;i<nisdofs;i++) {
76336e683305SStefano Zampini       /* ierr = ISView(pcbddc->ISForDofsLocal[i],0);CHKERRQ(ierr); */
76341e0482f5SStefano Zampini       if (nedcfield != i) {
76356e683305SStefano Zampini         ierr = ISGetLocalSize(pcbddc->ISForDofsLocal[i],&tsize);CHKERRQ(ierr);
76366e683305SStefano Zampini         ierr = ISGetIndices(pcbddc->ISForDofsLocal[i],&idxs);CHKERRQ(ierr);
76376e683305SStefano Zampini         ierr = ISGlobalToLocalMappingApply(tmap,IS_GTOLM_DROP,tsize,idxs,&nout,tidxs);CHKERRQ(ierr);
76386e683305SStefano Zampini         ierr = ISRestoreIndices(pcbddc->ISForDofsLocal[i],&idxs);CHKERRQ(ierr);
76391e0482f5SStefano Zampini       } else {
76401e0482f5SStefano Zampini         ierr = ISGetLocalSize(pcbddc->nedclocal,&tsize);CHKERRQ(ierr);
76411e0482f5SStefano Zampini         ierr = ISGetIndices(pcbddc->nedclocal,&idxs);CHKERRQ(ierr);
76421e0482f5SStefano Zampini         ierr = ISGlobalToLocalMappingApply(tmap,IS_GTOLM_DROP,tsize,idxs,&nout,tidxs);CHKERRQ(ierr);
7643eee23b56SStefano Zampini         if (tsize != nout) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Failed when mapping coarse nedelec field! %d != %d\n",tsize,nout);
76441e0482f5SStefano Zampini         ierr = ISRestoreIndices(pcbddc->nedclocal,&idxs);CHKERRQ(ierr);
76451e0482f5SStefano Zampini       }
76466e683305SStefano Zampini       ierr = ISLocalToGlobalMappingApply(coarse_islg,nout,tidxs,tidxs2);CHKERRQ(ierr);
764730368db7SStefano Zampini       ierr = ISCreateGeneral(PetscObjectComm((PetscObject)pc),nout,tidxs2,PETSC_COPY_VALUES,&isarray[i]);CHKERRQ(ierr);
76486e683305SStefano Zampini       /* ierr = ISView(isarray[i],0);CHKERRQ(ierr); */
76496e683305SStefano Zampini     }
76506e683305SStefano Zampini     /* neumann boundaries */
76516e683305SStefano Zampini     if (pcbddc->NeumannBoundariesLocal) {
76526e683305SStefano Zampini       /* ierr = ISView(pcbddc->NeumannBoundariesLocal,0);CHKERRQ(ierr); */
76536e683305SStefano Zampini       ierr = ISGetLocalSize(pcbddc->NeumannBoundariesLocal,&tsize);CHKERRQ(ierr);
76546e683305SStefano Zampini       ierr = ISGetIndices(pcbddc->NeumannBoundariesLocal,&idxs);CHKERRQ(ierr);
76556e683305SStefano Zampini       ierr = ISGlobalToLocalMappingApply(tmap,IS_GTOLM_DROP,tsize,idxs,&nout,tidxs);CHKERRQ(ierr);
76566e683305SStefano Zampini       ierr = ISRestoreIndices(pcbddc->NeumannBoundariesLocal,&idxs);CHKERRQ(ierr);
76576e683305SStefano Zampini       ierr = ISLocalToGlobalMappingApply(coarse_islg,nout,tidxs,tidxs2);CHKERRQ(ierr);
765830368db7SStefano Zampini       ierr = ISCreateGeneral(PetscObjectComm((PetscObject)pc),nout,tidxs2,PETSC_COPY_VALUES,&isarray[nisdofs]);CHKERRQ(ierr);
76596e683305SStefano Zampini       /* ierr = ISView(isarray[nisdofs],0);CHKERRQ(ierr); */
76606e683305SStefano Zampini     }
76616e683305SStefano Zampini     /* free memory */
76626e683305SStefano Zampini     ierr = PetscFree(tidxs);CHKERRQ(ierr);
76636e683305SStefano Zampini     ierr = PetscFree(tidxs2);CHKERRQ(ierr);
76646e683305SStefano Zampini     ierr = ISLocalToGlobalMappingDestroy(&tmap);CHKERRQ(ierr);
76656e683305SStefano Zampini   } else {
76666e683305SStefano Zampini     nis = 0;
76676e683305SStefano Zampini     nisdofs = 0;
76686e683305SStefano Zampini     nisneu = 0;
766930368db7SStefano Zampini     nisvert = 0;
76706e683305SStefano Zampini     isarray = NULL;
76716e683305SStefano Zampini   }
76726e683305SStefano Zampini   /* destroy no longer needed map */
76736e683305SStefano Zampini   ierr = ISLocalToGlobalMappingDestroy(&coarse_islg);CHKERRQ(ierr);
76746e683305SStefano Zampini 
767557de7509SStefano Zampini   /* subassemble */
767657de7509SStefano Zampini   if (multilevel_allowed) {
76771ae86dd6SStefano Zampini     Vec       vp[1];
76781ae86dd6SStefano Zampini     PetscInt  nvecs = 0;
767957de7509SStefano Zampini     PetscBool reuse,reuser;
76801ae86dd6SStefano Zampini 
768157de7509SStefano Zampini     if (coarse_mat) reuse = PETSC_TRUE;
768257de7509SStefano Zampini     else reuse = PETSC_FALSE;
768357de7509SStefano Zampini     ierr = MPIU_Allreduce(&reuse,&reuser,1,MPIU_BOOL,MPI_LOR,PetscObjectComm((PetscObject)pc));CHKERRQ(ierr);
76841ae86dd6SStefano Zampini     vp[0] = NULL;
76851ae86dd6SStefano Zampini     if (pcbddc->benign_have_null) { /* propagate no-net-flux quadrature to coarser level */
76861ae86dd6SStefano Zampini       ierr = VecCreate(PetscObjectComm((PetscObject)pc),&vp[0]);CHKERRQ(ierr);
76871ae86dd6SStefano Zampini       ierr = VecSetSizes(vp[0],pcbddc->local_primal_size,PETSC_DECIDE);CHKERRQ(ierr);
76881ae86dd6SStefano Zampini       ierr = VecSetType(vp[0],VECSTANDARD);CHKERRQ(ierr);
76891ae86dd6SStefano Zampini       nvecs = 1;
76901ae86dd6SStefano Zampini 
76911ae86dd6SStefano Zampini       if (pcbddc->divudotp) {
7692a198735bSStefano Zampini         Mat      B,loc_divudotp;
76931ae86dd6SStefano Zampini         Vec      v,p;
76941ae86dd6SStefano Zampini         IS       dummy;
76951ae86dd6SStefano Zampini         PetscInt np;
76961ae86dd6SStefano Zampini 
7697a198735bSStefano Zampini         ierr = MatISGetLocalMat(pcbddc->divudotp,&loc_divudotp);CHKERRQ(ierr);
7698a198735bSStefano Zampini         ierr = MatGetSize(loc_divudotp,&np,NULL);CHKERRQ(ierr);
76991ae86dd6SStefano Zampini         ierr = ISCreateStride(PETSC_COMM_SELF,np,0,1,&dummy);CHKERRQ(ierr);
77007dae84e0SHong Zhang         ierr = MatCreateSubMatrix(loc_divudotp,dummy,pcis->is_B_local,MAT_INITIAL_MATRIX,&B);CHKERRQ(ierr);
77011ae86dd6SStefano Zampini         ierr = MatCreateVecs(B,&v,&p);CHKERRQ(ierr);
77021ae86dd6SStefano Zampini         ierr = VecSet(p,1.);CHKERRQ(ierr);
77031ae86dd6SStefano Zampini         ierr = MatMultTranspose(B,p,v);CHKERRQ(ierr);
77041ae86dd6SStefano Zampini         ierr = VecDestroy(&p);CHKERRQ(ierr);
77051ae86dd6SStefano Zampini         ierr = MatDestroy(&B);CHKERRQ(ierr);
77061ae86dd6SStefano Zampini         ierr = VecGetArray(vp[0],&array);CHKERRQ(ierr);
77071ae86dd6SStefano Zampini         ierr = VecPlaceArray(pcbddc->vec1_P,array);CHKERRQ(ierr);
77081ae86dd6SStefano Zampini         ierr = VecRestoreArray(vp[0],&array);CHKERRQ(ierr);
77091ae86dd6SStefano Zampini         ierr = MatMultTranspose(pcbddc->coarse_phi_B,v,pcbddc->vec1_P);CHKERRQ(ierr);
77101ae86dd6SStefano Zampini         ierr = VecResetArray(pcbddc->vec1_P);CHKERRQ(ierr);
77111ae86dd6SStefano Zampini         ierr = ISDestroy(&dummy);CHKERRQ(ierr);
77121ae86dd6SStefano Zampini         ierr = VecDestroy(&v);CHKERRQ(ierr);
771374e2c79eSStefano Zampini       }
77141ae86dd6SStefano Zampini     }
77151ae86dd6SStefano Zampini     if (reuser) {
77161e0482f5SStefano Zampini       ierr = PCBDDCMatISSubassemble(t_coarse_mat_is,pcbddc->coarse_subassembling,0,restr,full_restr,PETSC_TRUE,&coarse_mat,nis,isarray,nvecs,vp);CHKERRQ(ierr);
771774e2c79eSStefano Zampini     } else {
77181e0482f5SStefano Zampini       ierr = PCBDDCMatISSubassemble(t_coarse_mat_is,pcbddc->coarse_subassembling,0,restr,full_restr,PETSC_FALSE,&coarse_mat_is,nis,isarray,nvecs,vp);CHKERRQ(ierr);
77191ae86dd6SStefano Zampini     }
77201ae86dd6SStefano Zampini     if (vp[0]) { /* vp[0] could have been placed on a different set of processes */
77211ae86dd6SStefano Zampini       PetscScalar *arraym,*arrayv;
77221ae86dd6SStefano Zampini       PetscInt    nl;
77231ae86dd6SStefano Zampini       ierr = VecGetLocalSize(vp[0],&nl);CHKERRQ(ierr);
77241ae86dd6SStefano Zampini       ierr = MatCreateSeqDense(PETSC_COMM_SELF,1,nl,NULL,&coarsedivudotp);CHKERRQ(ierr);
77251ae86dd6SStefano Zampini       ierr = MatDenseGetArray(coarsedivudotp,&arraym);CHKERRQ(ierr);
77261ae86dd6SStefano Zampini       ierr = VecGetArray(vp[0],&arrayv);CHKERRQ(ierr);
77271ae86dd6SStefano Zampini       ierr = PetscMemcpy(arraym,arrayv,nl*sizeof(PetscScalar));CHKERRQ(ierr);
77281ae86dd6SStefano Zampini       ierr = VecRestoreArray(vp[0],&arrayv);CHKERRQ(ierr);
77291ae86dd6SStefano Zampini       ierr = MatDenseRestoreArray(coarsedivudotp,&arraym);CHKERRQ(ierr);
77301ae86dd6SStefano Zampini       ierr = VecDestroy(&vp[0]);CHKERRQ(ierr);
7731a198735bSStefano Zampini     } else {
7732a198735bSStefano Zampini       ierr = MatCreateSeqAIJ(PETSC_COMM_SELF,0,0,1,NULL,&coarsedivudotp);CHKERRQ(ierr);
77331ae86dd6SStefano Zampini     }
77341ae86dd6SStefano Zampini   } else {
77351e0482f5SStefano Zampini     ierr = PCBDDCMatISSubassemble(t_coarse_mat_is,pcbddc->coarse_subassembling,0,restr,full_restr,PETSC_FALSE,&coarse_mat_is,0,NULL,0,NULL);CHKERRQ(ierr);
77366e683305SStefano Zampini   }
773757de7509SStefano Zampini   if (coarse_mat_is || coarse_mat) {
773857de7509SStefano Zampini     PetscMPIInt size;
7739f913dca9SStefano Zampini     ierr = MPI_Comm_size(PetscObjectComm((PetscObject)coarse_mat_is),&size);CHKERRQ(ierr);
774057de7509SStefano Zampini     if (!multilevel_allowed) {
774157de7509SStefano Zampini       ierr = MatISGetMPIXAIJ(coarse_mat_is,coarse_mat_reuse,&coarse_mat);CHKERRQ(ierr);
77426e683305SStefano Zampini     } else {
774357de7509SStefano Zampini       Mat A;
7744779c1cceSStefano Zampini 
774557de7509SStefano Zampini       /* if this matrix is present, it means we are not reusing the coarse matrix */
774657de7509SStefano Zampini       if (coarse_mat_is) {
774757de7509SStefano Zampini         if (coarse_mat) SETERRQ(PetscObjectComm((PetscObject)coarse_mat_is),PETSC_ERR_PLIB,"This should not happen");
774857de7509SStefano Zampini         ierr = PetscObjectReference((PetscObject)coarse_mat_is);CHKERRQ(ierr);
774957de7509SStefano Zampini         coarse_mat = coarse_mat_is;
775057de7509SStefano Zampini       }
775157de7509SStefano Zampini       /* be sure we don't have MatSeqDENSE as local mat */
775257de7509SStefano Zampini       ierr = MatISGetLocalMat(coarse_mat,&A);CHKERRQ(ierr);
775357de7509SStefano Zampini       ierr = MatConvert(A,MATSEQAIJ,MAT_INPLACE_MATRIX,&A);CHKERRQ(ierr);
7754779c1cceSStefano Zampini     }
7755779c1cceSStefano Zampini   }
775657de7509SStefano Zampini   ierr = MatDestroy(&t_coarse_mat_is);CHKERRQ(ierr);
775757de7509SStefano Zampini   ierr = MatDestroy(&coarse_mat_is);CHKERRQ(ierr);
77586e683305SStefano Zampini 
77596e683305SStefano Zampini   /* create local to global scatters for coarse problem */
776068457ee5SStefano Zampini   if (compute_vecs) {
77616e683305SStefano Zampini     PetscInt lrows;
77626e683305SStefano Zampini     ierr = VecDestroy(&pcbddc->coarse_vec);CHKERRQ(ierr);
776357de7509SStefano Zampini     if (coarse_mat) {
776457de7509SStefano Zampini       ierr = MatGetLocalSize(coarse_mat,&lrows,NULL);CHKERRQ(ierr);
77656e683305SStefano Zampini     } else {
77666e683305SStefano Zampini       lrows = 0;
77676e683305SStefano Zampini     }
77686e683305SStefano Zampini     ierr = VecCreate(PetscObjectComm((PetscObject)pc),&pcbddc->coarse_vec);CHKERRQ(ierr);
77696e683305SStefano Zampini     ierr = VecSetSizes(pcbddc->coarse_vec,lrows,PETSC_DECIDE);CHKERRQ(ierr);
77706e683305SStefano Zampini     ierr = VecSetType(pcbddc->coarse_vec,VECSTANDARD);CHKERRQ(ierr);
77716e683305SStefano Zampini     ierr = VecScatterDestroy(&pcbddc->coarse_loc_to_glob);CHKERRQ(ierr);
77726e683305SStefano Zampini     ierr = VecScatterCreate(pcbddc->vec1_P,NULL,pcbddc->coarse_vec,coarse_is,&pcbddc->coarse_loc_to_glob);CHKERRQ(ierr);
77736e683305SStefano Zampini   }
77746e683305SStefano Zampini   ierr = ISDestroy(&coarse_is);CHKERRQ(ierr);
7775c8587f34SStefano Zampini 
7776f9eb5b7dSStefano Zampini   /* set defaults for coarse KSP and PC */
7777f9eb5b7dSStefano Zampini   if (multilevel_allowed) {
7778f9eb5b7dSStefano Zampini     coarse_ksp_type = KSPRICHARDSON;
7779f9eb5b7dSStefano Zampini     coarse_pc_type = PCBDDC;
7780f9eb5b7dSStefano Zampini   } else {
7781f9eb5b7dSStefano Zampini     coarse_ksp_type = KSPPREONLY;
7782f9eb5b7dSStefano Zampini     coarse_pc_type = PCREDUNDANT;
7783c8587f34SStefano Zampini   }
7784c8587f34SStefano Zampini 
77856e683305SStefano Zampini   /* print some info if requested */
77866e683305SStefano Zampini   if (pcbddc->dbg_flag) {
77876e683305SStefano Zampini     if (!multilevel_allowed) {
77886e683305SStefano Zampini       ierr = PetscViewerASCIIPrintf(pcbddc->dbg_viewer,"--------------------------------------------------\n");CHKERRQ(ierr);
77896e683305SStefano Zampini       if (multilevel_requested) {
77906e683305SStefano Zampini         ierr = PetscViewerASCIIPrintf(pcbddc->dbg_viewer,"Not enough active processes on level %d (active processes %d, coarsening ratio %d)\n",pcbddc->current_level,active_procs,pcbddc->coarsening_ratio);CHKERRQ(ierr);
77916e683305SStefano Zampini       } else if (pcbddc->max_levels) {
77926e683305SStefano Zampini         ierr = PetscViewerASCIIPrintf(pcbddc->dbg_viewer,"Maximum number of requested levels reached (%d)\n",pcbddc->max_levels);CHKERRQ(ierr);
77936e683305SStefano Zampini       }
77946e683305SStefano Zampini       ierr = PetscViewerFlush(pcbddc->dbg_viewer);CHKERRQ(ierr);
77956e683305SStefano Zampini     }
77966e683305SStefano Zampini   }
77976e683305SStefano Zampini 
77981e0482f5SStefano Zampini   /* communicate coarse discrete gradient */
77991e0482f5SStefano Zampini   coarseG = NULL;
78001e0482f5SStefano Zampini   if (pcbddc->nedcG && multilevel_allowed) {
78011e0482f5SStefano Zampini     MPI_Comm ccomm;
78021e0482f5SStefano Zampini     if (coarse_mat) {
78031e0482f5SStefano Zampini       ccomm = PetscObjectComm((PetscObject)coarse_mat);
78041e0482f5SStefano Zampini     } else {
78051e0482f5SStefano Zampini       ccomm = MPI_COMM_NULL;
78061e0482f5SStefano Zampini     }
78071e0482f5SStefano Zampini     ierr = MatMPIAIJRestrict(pcbddc->nedcG,ccomm,&coarseG);CHKERRQ(ierr);
78081e0482f5SStefano Zampini   }
78091e0482f5SStefano Zampini 
7810f9eb5b7dSStefano Zampini   /* create the coarse KSP object only once with defaults */
781157de7509SStefano Zampini   if (coarse_mat) {
78127274672aSStefano Zampini     PetscBool   isredundant,isnn,isbddc;
78136a1308c2SStefano Zampini     PetscViewer dbg_viewer = NULL;
78147274672aSStefano Zampini 
78156e683305SStefano Zampini     if (pcbddc->dbg_flag) {
781657de7509SStefano Zampini       dbg_viewer = PETSC_VIEWER_STDOUT_(PetscObjectComm((PetscObject)coarse_mat));
78176e683305SStefano Zampini       ierr = PetscViewerASCIIAddTab(dbg_viewer,2*pcbddc->current_level);CHKERRQ(ierr);
78186e683305SStefano Zampini     }
7819f9eb5b7dSStefano Zampini     if (!pcbddc->coarse_ksp) {
7820312be037SStefano Zampini       char prefix[256],str_level[16];
7821e604994aSStefano Zampini       size_t len;
78221e0482f5SStefano Zampini 
782357de7509SStefano Zampini       ierr = KSPCreate(PetscObjectComm((PetscObject)coarse_mat),&pcbddc->coarse_ksp);CHKERRQ(ierr);
7824422a814eSBarry Smith       ierr = KSPSetErrorIfNotConverged(pcbddc->coarse_ksp,pc->erroriffailure);CHKERRQ(ierr);
7825c8587f34SStefano Zampini       ierr = PetscObjectIncrementTabLevel((PetscObject)pcbddc->coarse_ksp,(PetscObject)pc,1);CHKERRQ(ierr);
7826f9eb5b7dSStefano Zampini       ierr = KSPSetTolerances(pcbddc->coarse_ksp,PETSC_DEFAULT,PETSC_DEFAULT,PETSC_DEFAULT,1);CHKERRQ(ierr);
782757de7509SStefano Zampini       ierr = KSPSetOperators(pcbddc->coarse_ksp,coarse_mat,coarse_mat);CHKERRQ(ierr);
7828c8587f34SStefano Zampini       ierr = KSPSetType(pcbddc->coarse_ksp,coarse_ksp_type);CHKERRQ(ierr);
78296e683305SStefano Zampini       ierr = KSPSetNormType(pcbddc->coarse_ksp,KSP_NORM_NONE);CHKERRQ(ierr);
7830c8587f34SStefano Zampini       ierr = KSPGetPC(pcbddc->coarse_ksp,&pc_temp);CHKERRQ(ierr);
78311e0482f5SStefano Zampini       /* TODO is this logic correct? should check for coarse_mat type */
7832c8587f34SStefano Zampini       ierr = PCSetType(pc_temp,coarse_pc_type);CHKERRQ(ierr);
7833e604994aSStefano Zampini       /* prefix */
7834e604994aSStefano Zampini       ierr = PetscStrcpy(prefix,"");CHKERRQ(ierr);
7835e604994aSStefano Zampini       ierr = PetscStrcpy(str_level,"");CHKERRQ(ierr);
7836e604994aSStefano Zampini       if (!pcbddc->current_level) {
7837e604994aSStefano Zampini         ierr = PetscStrcpy(prefix,((PetscObject)pc)->prefix);CHKERRQ(ierr);
7838e604994aSStefano Zampini         ierr = PetscStrcat(prefix,"pc_bddc_coarse_");CHKERRQ(ierr);
7839c8587f34SStefano Zampini       } else {
7840e604994aSStefano Zampini         ierr = PetscStrlen(((PetscObject)pc)->prefix,&len);CHKERRQ(ierr);
7841312be037SStefano Zampini         if (pcbddc->current_level>1) len -= 3; /* remove "lX_" with X level number */
7842312be037SStefano Zampini         if (pcbddc->current_level>10) len -= 1; /* remove another char from level number */
784334d6797cSStefano Zampini         ierr = PetscStrncpy(prefix,((PetscObject)pc)->prefix,len+1);CHKERRQ(ierr);
784435529e7bSStefano Zampini         ierr = PetscSNPrintf(str_level,sizeof(str_level),"l%d_",(int)(pcbddc->current_level));CHKERRQ(ierr);
7845e604994aSStefano Zampini         ierr = PetscStrcat(prefix,str_level);CHKERRQ(ierr);
7846e604994aSStefano Zampini       }
7847e604994aSStefano Zampini       ierr = KSPSetOptionsPrefix(pcbddc->coarse_ksp,prefix);CHKERRQ(ierr);
78483e3c6dadSStefano Zampini       /* propagate BDDC info to the next level (these are dummy calls if pc_temp is not of type PCBDDC) */
78493e3c6dadSStefano Zampini       ierr = PCBDDCSetLevel(pc_temp,pcbddc->current_level+1);CHKERRQ(ierr);
78503e3c6dadSStefano Zampini       ierr = PCBDDCSetCoarseningRatio(pc_temp,pcbddc->coarsening_ratio);CHKERRQ(ierr);
78513e3c6dadSStefano Zampini       ierr = PCBDDCSetLevels(pc_temp,pcbddc->max_levels);CHKERRQ(ierr);
7852f9eb5b7dSStefano Zampini       /* allow user customization */
7853f9eb5b7dSStefano Zampini       ierr = KSPSetFromOptions(pcbddc->coarse_ksp);CHKERRQ(ierr);
78543e3c6dadSStefano Zampini     }
78553e3c6dadSStefano Zampini     /* propagate BDDC info to the next level (these are dummy calls if pc_temp is not of type PCBDDC) */
785651bea450SStefano Zampini     ierr = KSPGetPC(pcbddc->coarse_ksp,&pc_temp);CHKERRQ(ierr);
78573e3c6dadSStefano Zampini     if (nisdofs) {
78583e3c6dadSStefano Zampini       ierr = PCBDDCSetDofsSplitting(pc_temp,nisdofs,isarray);CHKERRQ(ierr);
78593e3c6dadSStefano Zampini       for (i=0;i<nisdofs;i++) {
78603e3c6dadSStefano Zampini         ierr = ISDestroy(&isarray[i]);CHKERRQ(ierr);
78613e3c6dadSStefano Zampini       }
78623e3c6dadSStefano Zampini     }
78633e3c6dadSStefano Zampini     if (nisneu) {
78643e3c6dadSStefano Zampini       ierr = PCBDDCSetNeumannBoundaries(pc_temp,isarray[nisdofs]);CHKERRQ(ierr);
78653e3c6dadSStefano Zampini       ierr = ISDestroy(&isarray[nisdofs]);CHKERRQ(ierr);
7866312be037SStefano Zampini     }
786730368db7SStefano Zampini     if (nisvert) {
786830368db7SStefano Zampini       ierr = PCBDDCSetPrimalVerticesIS(pc_temp,isarray[nis-1]);CHKERRQ(ierr);
786930368db7SStefano Zampini       ierr = ISDestroy(&isarray[nis-1]);CHKERRQ(ierr);
787030368db7SStefano Zampini     }
78711e0482f5SStefano Zampini     if (coarseG) {
78721e0482f5SStefano Zampini       ierr = PCBDDCSetDiscreteGradient(pc_temp,coarseG,1,nedcfield,PETSC_FALSE,PETSC_TRUE);CHKERRQ(ierr);
78731e0482f5SStefano Zampini     }
7874f9eb5b7dSStefano Zampini 
7875f9eb5b7dSStefano Zampini     /* get some info after set from options */
7876f9eb5b7dSStefano Zampini     ierr = PetscObjectTypeCompare((PetscObject)pc_temp,PCBDDC,&isbddc);CHKERRQ(ierr);
7877b76f3995Sstefano_zampini     /* multilevel can only be requested via -pc_bddc_levels or PCBDDCSetLevels */
7878b76f3995Sstefano_zampini     if (isbddc && !multilevel_allowed) {
7879f9eb5b7dSStefano Zampini       ierr   = PCSetType(pc_temp,coarse_pc_type);CHKERRQ(ierr);
7880f9eb5b7dSStefano Zampini       isbddc = PETSC_FALSE;
7881f9eb5b7dSStefano Zampini     }
7882b76f3995Sstefano_zampini     /* multilevel cannot be done with coarse PCs different from BDDC or NN */
78837274672aSStefano Zampini     ierr = PetscObjectTypeCompare((PetscObject)pc_temp,PCNN,&isnn);CHKERRQ(ierr);
78847274672aSStefano Zampini     if (multilevel_requested && multilevel_allowed && !isbddc && !isnn) {
7885b76f3995Sstefano_zampini       ierr   = PCSetType(pc_temp,PCBDDC);CHKERRQ(ierr);
7886b76f3995Sstefano_zampini       isbddc = PETSC_TRUE;
7887b76f3995Sstefano_zampini     }
788839f0f02cSStefano Zampini     ierr = PCFactorSetReuseFill(pc_temp,PETSC_TRUE);CHKERRQ(ierr);
78897274672aSStefano Zampini     ierr = PetscObjectTypeCompare((PetscObject)pc_temp,PCREDUNDANT,&isredundant);CHKERRQ(ierr);
78904f3a063dSStefano Zampini     if (isredundant) {
78914f3a063dSStefano Zampini       KSP inner_ksp;
78924f3a063dSStefano Zampini       PC  inner_pc;
78939326c5c6Sstefano_zampini 
78944f3a063dSStefano Zampini       ierr = PCRedundantGetKSP(pc_temp,&inner_ksp);CHKERRQ(ierr);
78954f3a063dSStefano Zampini       ierr = KSPGetPC(inner_ksp,&inner_pc);CHKERRQ(ierr);
78964f3a063dSStefano Zampini       ierr = PCFactorSetReuseFill(inner_pc,PETSC_TRUE);CHKERRQ(ierr);
78974f3a063dSStefano Zampini     }
7898f9eb5b7dSStefano Zampini 
789957de7509SStefano Zampini     /* parameters which miss an API */
79007274672aSStefano Zampini     ierr = PetscObjectTypeCompare((PetscObject)pc_temp,PCBDDC,&isbddc);CHKERRQ(ierr);
790157de7509SStefano Zampini     if (isbddc) {
7902720d30f9SStefano Zampini       PC_BDDC* pcbddc_coarse = (PC_BDDC*)pc_temp->data;
79037274672aSStefano Zampini 
7904720d30f9SStefano Zampini       pcbddc_coarse->detect_disconnected = PETSC_TRUE;
790557de7509SStefano Zampini       pcbddc_coarse->coarse_eqs_per_proc = pcbddc->coarse_eqs_per_proc;
790627b6a85dSStefano Zampini       pcbddc_coarse->benign_saddle_point = pcbddc->benign_have_null;
790727b6a85dSStefano Zampini       if (pcbddc_coarse->benign_saddle_point) {
7908a198735bSStefano Zampini         Mat                    coarsedivudotp_is;
7909a198735bSStefano Zampini         ISLocalToGlobalMapping l2gmap,rl2g,cl2g;
7910a198735bSStefano Zampini         IS                     row,col;
7911a198735bSStefano Zampini         const PetscInt         *gidxs;
7912a198735bSStefano Zampini         PetscInt               n,st,M,N;
7913a198735bSStefano Zampini 
7914a198735bSStefano Zampini         ierr = MatGetSize(coarsedivudotp,&n,NULL);CHKERRQ(ierr);
7915a198735bSStefano Zampini         ierr = MPI_Scan(&n,&st,1,MPIU_INT,MPI_SUM,PetscObjectComm((PetscObject)coarse_mat));CHKERRQ(ierr);
7916a198735bSStefano Zampini         st   = st-n;
7917a198735bSStefano Zampini         ierr = ISCreateStride(PetscObjectComm((PetscObject)coarse_mat),1,st,1,&row);CHKERRQ(ierr);
7918a198735bSStefano Zampini         ierr = MatGetLocalToGlobalMapping(coarse_mat,&l2gmap,NULL);CHKERRQ(ierr);
7919a198735bSStefano Zampini         ierr = ISLocalToGlobalMappingGetSize(l2gmap,&n);CHKERRQ(ierr);
7920a198735bSStefano Zampini         ierr = ISLocalToGlobalMappingGetIndices(l2gmap,&gidxs);CHKERRQ(ierr);
7921a198735bSStefano Zampini         ierr = ISCreateGeneral(PetscObjectComm((PetscObject)coarse_mat),n,gidxs,PETSC_COPY_VALUES,&col);CHKERRQ(ierr);
7922a198735bSStefano Zampini         ierr = ISLocalToGlobalMappingRestoreIndices(l2gmap,&gidxs);CHKERRQ(ierr);
7923a198735bSStefano Zampini         ierr = ISLocalToGlobalMappingCreateIS(row,&rl2g);CHKERRQ(ierr);
7924a198735bSStefano Zampini         ierr = ISLocalToGlobalMappingCreateIS(col,&cl2g);CHKERRQ(ierr);
7925a198735bSStefano Zampini         ierr = ISGetSize(row,&M);CHKERRQ(ierr);
7926a198735bSStefano Zampini         ierr = MatGetSize(coarse_mat,&N,NULL);CHKERRQ(ierr);
7927a198735bSStefano Zampini         ierr = ISDestroy(&row);CHKERRQ(ierr);
7928a198735bSStefano Zampini         ierr = ISDestroy(&col);CHKERRQ(ierr);
7929a198735bSStefano Zampini         ierr = MatCreate(PetscObjectComm((PetscObject)coarse_mat),&coarsedivudotp_is);CHKERRQ(ierr);
7930a198735bSStefano Zampini         ierr = MatSetType(coarsedivudotp_is,MATIS);CHKERRQ(ierr);
7931a198735bSStefano Zampini         ierr = MatSetSizes(coarsedivudotp_is,PETSC_DECIDE,PETSC_DECIDE,M,N);CHKERRQ(ierr);
7932a198735bSStefano Zampini         ierr = MatSetLocalToGlobalMapping(coarsedivudotp_is,rl2g,cl2g);CHKERRQ(ierr);
7933a198735bSStefano Zampini         ierr = ISLocalToGlobalMappingDestroy(&rl2g);CHKERRQ(ierr);
7934a198735bSStefano Zampini         ierr = ISLocalToGlobalMappingDestroy(&cl2g);CHKERRQ(ierr);
7935a198735bSStefano Zampini         ierr = MatISSetLocalMat(coarsedivudotp_is,coarsedivudotp);CHKERRQ(ierr);
7936a198735bSStefano Zampini         ierr = MatDestroy(&coarsedivudotp);CHKERRQ(ierr);
79378ae0ca82SStefano Zampini         ierr = PCBDDCSetDivergenceMat(pc_temp,coarsedivudotp_is,PETSC_FALSE,NULL);CHKERRQ(ierr);
7938a198735bSStefano Zampini         ierr = MatDestroy(&coarsedivudotp_is);CHKERRQ(ierr);
7939720d30f9SStefano Zampini         pcbddc_coarse->adaptive_userdefined = PETSC_TRUE;
794059e48ca4SStefano Zampini         if (pcbddc->adaptive_threshold < 1.0) pcbddc_coarse->deluxe_zerorows = PETSC_TRUE;
7941720d30f9SStefano Zampini       }
7942d4d8cf7bSStefano Zampini     }
79439881197aSStefano Zampini 
79443301b35fSStefano Zampini     /* propagate symmetry info of coarse matrix */
79455a16e3a0SStefano Zampini     ierr = MatSetOption(coarse_mat,MAT_STRUCTURALLY_SYMMETRIC,PETSC_TRUE);CHKERRQ(ierr);
79463301b35fSStefano Zampini     if (pc->pmat->symmetric_set) {
79473301b35fSStefano Zampini       ierr = MatSetOption(coarse_mat,MAT_SYMMETRIC,pc->pmat->symmetric);CHKERRQ(ierr);
79483301b35fSStefano Zampini     }
79493301b35fSStefano Zampini     if (pc->pmat->hermitian_set) {
79503301b35fSStefano Zampini       ierr = MatSetOption(coarse_mat,MAT_HERMITIAN,pc->pmat->hermitian);CHKERRQ(ierr);
79513301b35fSStefano Zampini     }
79523301b35fSStefano Zampini     if (pc->pmat->spd_set) {
79533301b35fSStefano Zampini       ierr = MatSetOption(coarse_mat,MAT_SPD,pc->pmat->spd);CHKERRQ(ierr);
79543301b35fSStefano Zampini     }
795527b6a85dSStefano Zampini     if (pcbddc->benign_saddle_point && !pcbddc->benign_have_null) {
795627b6a85dSStefano Zampini       ierr = MatSetOption(coarse_mat,MAT_SPD,PETSC_TRUE);CHKERRQ(ierr);
795727b6a85dSStefano Zampini     }
79586e683305SStefano Zampini     /* set operators */
79595f76c7aeSStefano Zampini     ierr = KSPSetOperators(pcbddc->coarse_ksp,coarse_mat,coarse_mat);CHKERRQ(ierr);
79606e683305SStefano Zampini     if (pcbddc->dbg_flag) {
79616e683305SStefano Zampini       ierr = PetscViewerASCIISubtractTab(dbg_viewer,2*pcbddc->current_level);CHKERRQ(ierr);
79626e683305SStefano Zampini     }
79636e683305SStefano Zampini   }
79641e0482f5SStefano Zampini   ierr = MatDestroy(&coarseG);CHKERRQ(ierr);
79656e683305SStefano Zampini   ierr = PetscFree(isarray);CHKERRQ(ierr);
7966b1ecc7b1SStefano Zampini #if 0
7967b9b85e73SStefano Zampini   {
7968b9b85e73SStefano Zampini     PetscViewer viewer;
7969b9b85e73SStefano Zampini     char filename[256];
7970b1ecc7b1SStefano Zampini     sprintf(filename,"coarse_mat_level%d.m",pcbddc->current_level);
7971b1ecc7b1SStefano Zampini     ierr = PetscViewerASCIIOpen(PetscObjectComm((PetscObject)coarse_mat),filename,&viewer);CHKERRQ(ierr);
79726a9046bcSBarry Smith     ierr = PetscViewerPushFormat(viewer,PETSC_VIEWER_ASCII_MATLAB);CHKERRQ(ierr);
7973b9b85e73SStefano Zampini     ierr = MatView(coarse_mat,viewer);CHKERRQ(ierr);
7974f159cad9SBarry Smith     ierr = PetscViewerPopFormat(viewer);CHKERRQ(ierr);
7975b9b85e73SStefano Zampini     ierr = PetscViewerDestroy(&viewer);CHKERRQ(ierr);
7976b9b85e73SStefano Zampini   }
7977b9b85e73SStefano Zampini #endif
7978f9eb5b7dSStefano Zampini 
797998a51de6SStefano Zampini   if (pcbddc->coarse_ksp) {
798098a51de6SStefano Zampini     Vec crhs,csol;
798104708bb6SStefano Zampini 
7982f347579bSStefano Zampini     ierr = KSPGetSolution(pcbddc->coarse_ksp,&csol);CHKERRQ(ierr);
7983f347579bSStefano Zampini     ierr = KSPGetRhs(pcbddc->coarse_ksp,&crhs);CHKERRQ(ierr);
7984f347579bSStefano Zampini     if (!csol) {
79852a7a6963SBarry Smith       ierr = MatCreateVecs(coarse_mat,&((pcbddc->coarse_ksp)->vec_sol),NULL);CHKERRQ(ierr);
7986f9eb5b7dSStefano Zampini     }
7987f347579bSStefano Zampini     if (!crhs) {
79882a7a6963SBarry Smith       ierr = MatCreateVecs(coarse_mat,NULL,&((pcbddc->coarse_ksp)->vec_rhs));CHKERRQ(ierr);
7989f347579bSStefano Zampini     }
7990b0f5fe93SStefano Zampini   }
79911ae86dd6SStefano Zampini   ierr = MatDestroy(&coarsedivudotp);CHKERRQ(ierr);
7992b0f5fe93SStefano Zampini 
7993b0f5fe93SStefano Zampini   /* compute null space for coarse solver if the benign trick has been requested */
7994b0f5fe93SStefano Zampini   if (pcbddc->benign_null) {
7995b0f5fe93SStefano Zampini 
7996b0f5fe93SStefano Zampini     ierr = VecSet(pcbddc->vec1_P,0.);CHKERRQ(ierr);
79974f1b2e48SStefano Zampini     for (i=0;i<pcbddc->benign_n;i++) {
79984f1b2e48SStefano Zampini       ierr = VecSetValue(pcbddc->vec1_P,pcbddc->local_primal_size-pcbddc->benign_n+i,1.0,INSERT_VALUES);CHKERRQ(ierr);
79994f1b2e48SStefano Zampini     }
8000b0f5fe93SStefano Zampini     ierr = VecAssemblyBegin(pcbddc->vec1_P);CHKERRQ(ierr);
8001b0f5fe93SStefano Zampini     ierr = VecAssemblyEnd(pcbddc->vec1_P);CHKERRQ(ierr);
8002b0f5fe93SStefano Zampini     ierr = VecScatterBegin(pcbddc->coarse_loc_to_glob,pcbddc->vec1_P,pcbddc->coarse_vec,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
8003b0f5fe93SStefano Zampini     ierr = VecScatterEnd(pcbddc->coarse_loc_to_glob,pcbddc->vec1_P,pcbddc->coarse_vec,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
8004b0f5fe93SStefano Zampini     if (coarse_mat) {
8005b0f5fe93SStefano Zampini       Vec         nullv;
8006b0f5fe93SStefano Zampini       PetscScalar *array,*array2;
8007b0f5fe93SStefano Zampini       PetscInt    nl;
8008b0f5fe93SStefano Zampini 
8009b0f5fe93SStefano Zampini       ierr = MatCreateVecs(coarse_mat,&nullv,NULL);CHKERRQ(ierr);
8010b0f5fe93SStefano Zampini       ierr = VecGetLocalSize(nullv,&nl);CHKERRQ(ierr);
8011b0f5fe93SStefano Zampini       ierr = VecGetArrayRead(pcbddc->coarse_vec,(const PetscScalar**)&array);CHKERRQ(ierr);
8012b0f5fe93SStefano Zampini       ierr = VecGetArray(nullv,&array2);CHKERRQ(ierr);
8013b0f5fe93SStefano Zampini       ierr = PetscMemcpy(array2,array,nl*sizeof(*array));CHKERRQ(ierr);
8014b0f5fe93SStefano Zampini       ierr = VecRestoreArray(nullv,&array2);CHKERRQ(ierr);
8015b0f5fe93SStefano Zampini       ierr = VecRestoreArrayRead(pcbddc->coarse_vec,(const PetscScalar**)&array);CHKERRQ(ierr);
8016b0f5fe93SStefano Zampini       ierr = VecNormalize(nullv,NULL);CHKERRQ(ierr);
8017b0f5fe93SStefano Zampini       ierr = MatNullSpaceCreate(PetscObjectComm((PetscObject)coarse_mat),PETSC_FALSE,1,&nullv,&CoarseNullSpace);CHKERRQ(ierr);
8018b0f5fe93SStefano Zampini       ierr = VecDestroy(&nullv);CHKERRQ(ierr);
8019b0f5fe93SStefano Zampini     }
8020b0f5fe93SStefano Zampini   }
8021b0f5fe93SStefano Zampini 
8022b0f5fe93SStefano Zampini   if (pcbddc->coarse_ksp) {
8023b0f5fe93SStefano Zampini     PetscBool ispreonly;
8024b0f5fe93SStefano Zampini 
8025b0f5fe93SStefano Zampini     if (CoarseNullSpace) {
8026b0f5fe93SStefano Zampini       PetscBool isnull;
8027b0f5fe93SStefano Zampini       ierr = MatNullSpaceTest(CoarseNullSpace,coarse_mat,&isnull);CHKERRQ(ierr);
8028bef83e63SStefano Zampini       if (isnull) {
8029b0f5fe93SStefano Zampini         ierr = MatSetNullSpace(coarse_mat,CoarseNullSpace);CHKERRQ(ierr);
8030b0f5fe93SStefano Zampini       }
8031bef83e63SStefano Zampini       /* TODO: add local nullspaces (if any) */
8032b0f5fe93SStefano Zampini     }
8033b0f5fe93SStefano Zampini     /* setup coarse ksp */
8034b0f5fe93SStefano Zampini     ierr = KSPSetUp(pcbddc->coarse_ksp);CHKERRQ(ierr);
8035cbcc2c2aSStefano Zampini     /* Check coarse problem if in debug mode or if solving with an iterative method */
8036cbcc2c2aSStefano Zampini     ierr = PetscObjectTypeCompare((PetscObject)pcbddc->coarse_ksp,KSPPREONLY,&ispreonly);CHKERRQ(ierr);
80376e683305SStefano Zampini     if (pcbddc->dbg_flag || (!ispreonly && pcbddc->use_coarse_estimates) ) {
8038c8587f34SStefano Zampini       KSP       check_ksp;
80392b510759SStefano Zampini       KSPType   check_ksp_type;
8040c8587f34SStefano Zampini       PC        check_pc;
80416e683305SStefano Zampini       Vec       check_vec,coarse_vec;
80426a1308c2SStefano Zampini       PetscReal abs_infty_error,infty_error,lambda_min=1.0,lambda_max=1.0;
80432b510759SStefano Zampini       PetscInt  its;
80446e683305SStefano Zampini       PetscBool compute_eigs;
80456e683305SStefano Zampini       PetscReal *eigs_r,*eigs_c;
80466e683305SStefano Zampini       PetscInt  neigs;
80478e185a42SStefano Zampini       const char *prefix;
8048c8587f34SStefano Zampini 
80492b510759SStefano Zampini       /* Create ksp object suitable for estimation of extreme eigenvalues */
80506e683305SStefano Zampini       ierr = KSPCreate(PetscObjectComm((PetscObject)pcbddc->coarse_ksp),&check_ksp);CHKERRQ(ierr);
8051422a814eSBarry Smith       ierr = KSPSetErrorIfNotConverged(pcbddc->coarse_ksp,pc->erroriffailure);CHKERRQ(ierr);
805223ee1639SBarry Smith       ierr = KSPSetOperators(check_ksp,coarse_mat,coarse_mat);CHKERRQ(ierr);
8053f4ddd8eeSStefano Zampini       ierr = KSPSetTolerances(check_ksp,1.e-12,1.e-12,PETSC_DEFAULT,pcbddc->coarse_size);CHKERRQ(ierr);
8054e4d548c7SStefano Zampini       /* prevent from setup unneeded object */
8055e4d548c7SStefano Zampini       ierr = KSPGetPC(check_ksp,&check_pc);CHKERRQ(ierr);
8056e4d548c7SStefano Zampini       ierr = PCSetType(check_pc,PCNONE);CHKERRQ(ierr);
80572b510759SStefano Zampini       if (ispreonly) {
80582b510759SStefano Zampini         check_ksp_type = KSPPREONLY;
80596e683305SStefano Zampini         compute_eigs = PETSC_FALSE;
80602b510759SStefano Zampini       } else {
8061cbcc2c2aSStefano Zampini         check_ksp_type = KSPGMRES;
80626e683305SStefano Zampini         compute_eigs = PETSC_TRUE;
8063c8587f34SStefano Zampini       }
8064c8587f34SStefano Zampini       ierr = KSPSetType(check_ksp,check_ksp_type);CHKERRQ(ierr);
80656e683305SStefano Zampini       ierr = KSPSetComputeSingularValues(check_ksp,compute_eigs);CHKERRQ(ierr);
80666e683305SStefano Zampini       ierr = KSPSetComputeEigenvalues(check_ksp,compute_eigs);CHKERRQ(ierr);
80676e683305SStefano Zampini       ierr = KSPGMRESSetRestart(check_ksp,pcbddc->coarse_size+1);CHKERRQ(ierr);
8068a7dc3881SStefano Zampini       ierr = KSPGetOptionsPrefix(pcbddc->coarse_ksp,&prefix);CHKERRQ(ierr);
8069a7dc3881SStefano Zampini       ierr = KSPSetOptionsPrefix(check_ksp,prefix);CHKERRQ(ierr);
8070a7dc3881SStefano Zampini       ierr = KSPAppendOptionsPrefix(check_ksp,"check_");CHKERRQ(ierr);
8071a7dc3881SStefano Zampini       ierr = KSPSetFromOptions(check_ksp);CHKERRQ(ierr);
8072c8587f34SStefano Zampini       ierr = KSPSetUp(check_ksp);CHKERRQ(ierr);
8073c8587f34SStefano Zampini       ierr = KSPGetPC(pcbddc->coarse_ksp,&check_pc);CHKERRQ(ierr);
8074c8587f34SStefano Zampini       ierr = KSPSetPC(check_ksp,check_pc);CHKERRQ(ierr);
8075c8587f34SStefano Zampini       /* create random vec */
80762701bc32SStefano Zampini       ierr = MatCreateVecs(coarse_mat,&coarse_vec,&check_vec);CHKERRQ(ierr);
8077c8587f34SStefano Zampini       ierr = VecSetRandom(check_vec,NULL);CHKERRQ(ierr);
80786e683305SStefano Zampini       ierr = MatMult(coarse_mat,check_vec,coarse_vec);CHKERRQ(ierr);
8079c8587f34SStefano Zampini       /* solve coarse problem */
80806e683305SStefano Zampini       ierr = KSPSolve(check_ksp,coarse_vec,coarse_vec);CHKERRQ(ierr);
8081cbcc2c2aSStefano Zampini       /* set eigenvalue estimation if preonly has not been requested */
80826e683305SStefano Zampini       if (compute_eigs) {
8083854ce69bSBarry Smith         ierr = PetscMalloc1(pcbddc->coarse_size+1,&eigs_r);CHKERRQ(ierr);
8084854ce69bSBarry Smith         ierr = PetscMalloc1(pcbddc->coarse_size+1,&eigs_c);CHKERRQ(ierr);
80856e683305SStefano Zampini         ierr = KSPComputeEigenvalues(check_ksp,pcbddc->coarse_size+1,eigs_r,eigs_c,&neigs);CHKERRQ(ierr);
80861ae86dd6SStefano Zampini         if (neigs) {
80876e683305SStefano Zampini           lambda_max = eigs_r[neigs-1];
80886e683305SStefano Zampini           lambda_min = eigs_r[0];
80896e683305SStefano Zampini           if (pcbddc->use_coarse_estimates) {
80902701bc32SStefano Zampini             if (lambda_max>=lambda_min) { /* using PETSC_SMALL since lambda_max == lambda_min is not allowed by KSPChebyshevSetEigenvalues */
80912701bc32SStefano Zampini               ierr = KSPChebyshevSetEigenvalues(pcbddc->coarse_ksp,lambda_max+PETSC_SMALL,lambda_min);CHKERRQ(ierr);
8092cbcc2c2aSStefano Zampini               ierr = KSPRichardsonSetScale(pcbddc->coarse_ksp,2.0/(lambda_max+lambda_min));CHKERRQ(ierr);
8093cbcc2c2aSStefano Zampini             }
8094c8587f34SStefano Zampini           }
8095c8587f34SStefano Zampini         }
80961ae86dd6SStefano Zampini       }
8097cbcc2c2aSStefano Zampini 
8098c8587f34SStefano Zampini       /* check coarse problem residual error */
80996e683305SStefano Zampini       if (pcbddc->dbg_flag) {
81006e683305SStefano Zampini         PetscViewer dbg_viewer = PETSC_VIEWER_STDOUT_(PetscObjectComm((PetscObject)pcbddc->coarse_ksp));
81016e683305SStefano Zampini         ierr = PetscViewerASCIIAddTab(dbg_viewer,2*(pcbddc->current_level+1));CHKERRQ(ierr);
81026e683305SStefano Zampini         ierr = VecAXPY(check_vec,-1.0,coarse_vec);CHKERRQ(ierr);
8103c8587f34SStefano Zampini         ierr = VecNorm(check_vec,NORM_INFINITY,&infty_error);CHKERRQ(ierr);
81046e683305SStefano Zampini         ierr = MatMult(coarse_mat,check_vec,coarse_vec);CHKERRQ(ierr);
81056e683305SStefano Zampini         ierr = VecNorm(coarse_vec,NORM_INFINITY,&abs_infty_error);CHKERRQ(ierr);
8106779c1cceSStefano Zampini         ierr = PetscViewerASCIIPrintf(dbg_viewer,"Coarse problem details (use estimates %d)\n",pcbddc->use_coarse_estimates);CHKERRQ(ierr);
81076e683305SStefano Zampini         ierr = PetscObjectPrintClassNamePrefixType((PetscObject)(pcbddc->coarse_ksp),dbg_viewer);CHKERRQ(ierr);
81086e683305SStefano Zampini         ierr = PetscObjectPrintClassNamePrefixType((PetscObject)(check_pc),dbg_viewer);CHKERRQ(ierr);
81096e683305SStefano Zampini         ierr = PetscViewerASCIIPrintf(dbg_viewer,"Coarse problem exact infty_error   : %1.6e\n",infty_error);CHKERRQ(ierr);
81106e683305SStefano Zampini         ierr = PetscViewerASCIIPrintf(dbg_viewer,"Coarse problem residual infty_error: %1.6e\n",abs_infty_error);CHKERRQ(ierr);
8111b0f5fe93SStefano Zampini         if (CoarseNullSpace) {
8112b0f5fe93SStefano Zampini           ierr = PetscViewerASCIIPrintf(dbg_viewer,"Coarse problem is singular\n");CHKERRQ(ierr);
8113b0f5fe93SStefano Zampini         }
81146e683305SStefano Zampini         if (compute_eigs) {
81156e683305SStefano Zampini           PetscReal          lambda_max_s,lambda_min_s;
8116b03ebc13SStefano Zampini           KSPConvergedReason reason;
8117deec49d1SStefano Zampini           ierr = KSPGetType(check_ksp,&check_ksp_type);CHKERRQ(ierr);
8118c8587f34SStefano Zampini           ierr = KSPGetIterationNumber(check_ksp,&its);CHKERRQ(ierr);
8119b03ebc13SStefano Zampini           ierr = KSPGetConvergedReason(check_ksp,&reason);CHKERRQ(ierr);
81206e683305SStefano Zampini           ierr = KSPComputeExtremeSingularValues(check_ksp,&lambda_max_s,&lambda_min_s);CHKERRQ(ierr);
8121b03ebc13SStefano Zampini           ierr = PetscViewerASCIIPrintf(dbg_viewer,"Coarse problem eigenvalues (estimated with %d iterations of %s, conv reason %d): %1.6e %1.6e (%1.6e %1.6e)\n",its,check_ksp_type,reason,lambda_min,lambda_max,lambda_min_s,lambda_max_s);CHKERRQ(ierr);
81226e683305SStefano Zampini           for (i=0;i<neigs;i++) {
81236e683305SStefano Zampini             ierr = PetscViewerASCIIPrintf(dbg_viewer,"%1.6e %1.6ei\n",eigs_r[i],eigs_c[i]);CHKERRQ(ierr);
8124c8587f34SStefano Zampini           }
81256e683305SStefano Zampini         }
81266e683305SStefano Zampini         ierr = PetscViewerFlush(dbg_viewer);CHKERRQ(ierr);
81276e683305SStefano Zampini         ierr = PetscViewerASCIISubtractTab(dbg_viewer,2*(pcbddc->current_level+1));CHKERRQ(ierr);
81286e683305SStefano Zampini       }
8129e4d548c7SStefano Zampini       ierr = VecDestroy(&check_vec);CHKERRQ(ierr);
81302701bc32SStefano Zampini       ierr = VecDestroy(&coarse_vec);CHKERRQ(ierr);
8131c8587f34SStefano Zampini       ierr = KSPDestroy(&check_ksp);CHKERRQ(ierr);
81326e683305SStefano Zampini       if (compute_eigs) {
81336e683305SStefano Zampini         ierr = PetscFree(eigs_r);CHKERRQ(ierr);
81346e683305SStefano Zampini         ierr = PetscFree(eigs_c);CHKERRQ(ierr);
8135c8587f34SStefano Zampini       }
81366e683305SStefano Zampini     }
81376e683305SStefano Zampini   }
8138bef83e63SStefano Zampini   ierr = MatNullSpaceDestroy(&CoarseNullSpace);CHKERRQ(ierr);
8139cbcc2c2aSStefano Zampini   /* print additional info */
8140cbcc2c2aSStefano Zampini   if (pcbddc->dbg_flag) {
81416e683305SStefano Zampini     /* waits until all processes reaches this point */
81426e683305SStefano Zampini     ierr = PetscBarrier((PetscObject)pc);CHKERRQ(ierr);
8143cbcc2c2aSStefano Zampini     ierr = PetscViewerASCIIPrintf(pcbddc->dbg_viewer,"Coarse solver setup completed at level %d\n",pcbddc->current_level);CHKERRQ(ierr);
8144cbcc2c2aSStefano Zampini     ierr = PetscViewerFlush(pcbddc->dbg_viewer);CHKERRQ(ierr);
8145cbcc2c2aSStefano Zampini   }
8146cbcc2c2aSStefano Zampini 
81472b510759SStefano Zampini   /* free memory */
8148fdc635d7SStefano Zampini   ierr = MatDestroy(&coarse_mat);CHKERRQ(ierr);
8149c8587f34SStefano Zampini   PetscFunctionReturn(0);
8150c8587f34SStefano Zampini }
8151674ae819SStefano Zampini 
8152f34684f1SStefano Zampini PetscErrorCode PCBDDCComputePrimalNumbering(PC pc,PetscInt* coarse_size_n,PetscInt** local_primal_indices_n)
8153f34684f1SStefano Zampini {
8154f34684f1SStefano Zampini   PC_BDDC*       pcbddc = (PC_BDDC*)pc->data;
8155f34684f1SStefano Zampini   PC_IS*         pcis = (PC_IS*)pc->data;
8156f34684f1SStefano Zampini   Mat_IS*        matis = (Mat_IS*)pc->pmat->data;
8157dc456d91SStefano Zampini   IS             subset,subset_mult,subset_n;
8158dc456d91SStefano Zampini   PetscInt       local_size,coarse_size=0;
815973be2a3aSStefano Zampini   PetscInt       *local_primal_indices=NULL;
8160dc456d91SStefano Zampini   const PetscInt *t_local_primal_indices;
8161f34684f1SStefano Zampini   PetscErrorCode ierr;
8162f34684f1SStefano Zampini 
8163f34684f1SStefano Zampini   PetscFunctionBegin;
8164f34684f1SStefano Zampini   /* Compute global number of coarse dofs */
81656c4ed002SBarry Smith   if (pcbddc->local_primal_size && !pcbddc->local_primal_ref_node) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"BDDC ConstraintsSetUp should be called first");
8166dc456d91SStefano Zampini   ierr = ISCreateGeneral(PetscObjectComm((PetscObject)(pc->pmat)),pcbddc->local_primal_size_cc,pcbddc->local_primal_ref_node,PETSC_COPY_VALUES,&subset_n);CHKERRQ(ierr);
81673bbff08aSStefano Zampini   ierr = ISLocalToGlobalMappingApplyIS(pcis->mapping,subset_n,&subset);CHKERRQ(ierr);
8168dc456d91SStefano Zampini   ierr = ISDestroy(&subset_n);CHKERRQ(ierr);
8169dc456d91SStefano Zampini   ierr = ISCreateGeneral(PetscObjectComm((PetscObject)(pc->pmat)),pcbddc->local_primal_size_cc,pcbddc->local_primal_ref_mult,PETSC_COPY_VALUES,&subset_mult);CHKERRQ(ierr);
81706583bcc1SStefano Zampini   ierr = ISRenumber(subset,subset_mult,&coarse_size,&subset_n);CHKERRQ(ierr);
8171dc456d91SStefano Zampini   ierr = ISDestroy(&subset);CHKERRQ(ierr);
8172dc456d91SStefano Zampini   ierr = ISDestroy(&subset_mult);CHKERRQ(ierr);
8173dc456d91SStefano Zampini   ierr = ISGetLocalSize(subset_n,&local_size);CHKERRQ(ierr);
81746c4ed002SBarry Smith   if (local_size != pcbddc->local_primal_size) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Invalid number of local primal indices computed %D != %D",local_size,pcbddc->local_primal_size);
8175dc456d91SStefano Zampini   ierr = PetscMalloc1(local_size,&local_primal_indices);CHKERRQ(ierr);
8176dc456d91SStefano Zampini   ierr = ISGetIndices(subset_n,&t_local_primal_indices);CHKERRQ(ierr);
8177dc456d91SStefano Zampini   ierr = PetscMemcpy(local_primal_indices,t_local_primal_indices,local_size*sizeof(PetscInt));CHKERRQ(ierr);
8178dc456d91SStefano Zampini   ierr = ISRestoreIndices(subset_n,&t_local_primal_indices);CHKERRQ(ierr);
8179dc456d91SStefano Zampini   ierr = ISDestroy(&subset_n);CHKERRQ(ierr);
8180f34684f1SStefano Zampini 
8181f34684f1SStefano Zampini   /* check numbering */
8182f34684f1SStefano Zampini   if (pcbddc->dbg_flag) {
8183019a44ceSStefano Zampini     PetscScalar coarsesum,*array,*array2;
8184dc456d91SStefano Zampini     PetscInt    i;
8185b9b85e73SStefano Zampini     PetscBool   set_error = PETSC_FALSE,set_error_reduced = PETSC_FALSE;
8186f34684f1SStefano Zampini 
8187f34684f1SStefano Zampini     ierr = PetscViewerFlush(pcbddc->dbg_viewer);CHKERRQ(ierr);
8188f34684f1SStefano Zampini     ierr = PetscViewerASCIIPrintf(pcbddc->dbg_viewer,"--------------------------------------------------\n");CHKERRQ(ierr);
8189f34684f1SStefano Zampini     ierr = PetscViewerASCIIPrintf(pcbddc->dbg_viewer,"Check coarse indices\n");CHKERRQ(ierr);
81901575c14dSBarry Smith     ierr = PetscViewerASCIIPushSynchronized(pcbddc->dbg_viewer);CHKERRQ(ierr);
8191019a44ceSStefano Zampini     /* counter */
8192019a44ceSStefano Zampini     ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
8193019a44ceSStefano Zampini     ierr = VecSet(pcis->vec1_N,1.0);CHKERRQ(ierr);
8194019a44ceSStefano Zampini     ierr = VecScatterBegin(matis->rctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
8195019a44ceSStefano Zampini     ierr = VecScatterEnd(matis->rctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
8196019a44ceSStefano Zampini     ierr = VecScatterBegin(matis->rctx,pcis->vec1_global,pcis->vec2_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
8197019a44ceSStefano Zampini     ierr = VecScatterEnd(matis->rctx,pcis->vec1_global,pcis->vec2_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
8198f34684f1SStefano Zampini     ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr);
8199f34684f1SStefano Zampini     for (i=0;i<pcbddc->local_primal_size;i++) {
8200727cdba6SStefano Zampini       ierr = VecSetValue(pcis->vec1_N,pcbddc->primal_indices_local_idxs[i],1.0,INSERT_VALUES);CHKERRQ(ierr);
8201f34684f1SStefano Zampini     }
8202f34684f1SStefano Zampini     ierr = VecAssemblyBegin(pcis->vec1_N);CHKERRQ(ierr);
8203f34684f1SStefano Zampini     ierr = VecAssemblyEnd(pcis->vec1_N);CHKERRQ(ierr);
8204f34684f1SStefano Zampini     ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
8205e176bc59SStefano Zampini     ierr = VecScatterBegin(matis->rctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
8206e176bc59SStefano Zampini     ierr = VecScatterEnd(matis->rctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
8207e176bc59SStefano Zampini     ierr = VecScatterBegin(matis->rctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
8208e176bc59SStefano Zampini     ierr = VecScatterEnd(matis->rctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
8209f34684f1SStefano Zampini     ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
8210019a44ceSStefano Zampini     ierr = VecGetArray(pcis->vec2_N,&array2);CHKERRQ(ierr);
8211f34684f1SStefano Zampini     for (i=0;i<pcis->n;i++) {
8212019a44ceSStefano Zampini       if (array[i] != 0.0 && array[i] != array2[i]) {
82132c66d082SStefano Zampini         PetscInt owned = (PetscInt)PetscRealPart(array[i]),gi;
821475c01103SStefano Zampini         PetscInt neigh = (PetscInt)PetscRealPart(array2[i]);
8215b9b85e73SStefano Zampini         set_error = PETSC_TRUE;
82162c66d082SStefano Zampini         ierr = ISLocalToGlobalMappingApply(pcis->mapping,1,&i,&gi);CHKERRQ(ierr);
82172c66d082SStefano Zampini         ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"Subdomain %04d: local index %d (gid %d) owned by %d processes instead of %d!\n",PetscGlobalRank,i,gi,owned,neigh);CHKERRQ(ierr);
8218f34684f1SStefano Zampini       }
8219f34684f1SStefano Zampini     }
8220019a44ceSStefano Zampini     ierr = VecRestoreArray(pcis->vec2_N,&array2);CHKERRQ(ierr);
8221b2566f29SBarry Smith     ierr = MPIU_Allreduce(&set_error,&set_error_reduced,1,MPIU_BOOL,MPI_LOR,PetscObjectComm((PetscObject)pc));CHKERRQ(ierr);
8222f34684f1SStefano Zampini     ierr = PetscViewerFlush(pcbddc->dbg_viewer);CHKERRQ(ierr);
8223f34684f1SStefano Zampini     for (i=0;i<pcis->n;i++) {
8224f34684f1SStefano Zampini       if (PetscRealPart(array[i]) > 0.0) array[i] = 1.0/PetscRealPart(array[i]);
8225f34684f1SStefano Zampini     }
8226f34684f1SStefano Zampini     ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
8227f34684f1SStefano Zampini     ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
8228e176bc59SStefano Zampini     ierr = VecScatterBegin(matis->rctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
8229e176bc59SStefano Zampini     ierr = VecScatterEnd(matis->rctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
8230f34684f1SStefano Zampini     ierr = VecSum(pcis->vec1_global,&coarsesum);CHKERRQ(ierr);
8231f34684f1SStefano Zampini     ierr = PetscViewerASCIIPrintf(pcbddc->dbg_viewer,"Size of coarse problem is %d (%lf)\n",coarse_size,PetscRealPart(coarsesum));CHKERRQ(ierr);
8232b9b85e73SStefano Zampini     if (pcbddc->dbg_flag > 1 || set_error_reduced) {
8233ca8b9ea9SStefano Zampini       PetscInt *gidxs;
8234ca8b9ea9SStefano Zampini 
8235ca8b9ea9SStefano Zampini       ierr = PetscMalloc1(pcbddc->local_primal_size,&gidxs);CHKERRQ(ierr);
82363bbff08aSStefano Zampini       ierr = ISLocalToGlobalMappingApply(pcis->mapping,pcbddc->local_primal_size,pcbddc->primal_indices_local_idxs,gidxs);CHKERRQ(ierr);
8237f34684f1SStefano Zampini       ierr = PetscViewerASCIIPrintf(pcbddc->dbg_viewer,"Distribution of local primal indices\n");CHKERRQ(ierr);
8238f34684f1SStefano Zampini       ierr = PetscViewerFlush(pcbddc->dbg_viewer);CHKERRQ(ierr);
8239f34684f1SStefano Zampini       ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"Subdomain %04d\n",PetscGlobalRank);CHKERRQ(ierr);
8240f34684f1SStefano Zampini       for (i=0;i<pcbddc->local_primal_size;i++) {
82414bc2dc4bSStefano Zampini         ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"local_primal_indices[%d]=%d (%d,%d)\n",i,local_primal_indices[i],pcbddc->primal_indices_local_idxs[i],gidxs[i]);CHKERRQ(ierr);
8242f34684f1SStefano Zampini       }
8243f34684f1SStefano Zampini       ierr = PetscViewerFlush(pcbddc->dbg_viewer);CHKERRQ(ierr);
8244ca8b9ea9SStefano Zampini       ierr = PetscFree(gidxs);CHKERRQ(ierr);
8245f34684f1SStefano Zampini     }
8246f34684f1SStefano Zampini     ierr = PetscViewerFlush(pcbddc->dbg_viewer);CHKERRQ(ierr);
82471575c14dSBarry Smith     ierr = PetscViewerASCIIPushSynchronized(pcbddc->dbg_viewer);CHKERRQ(ierr);
8248302440fdSBarry Smith     if (set_error_reduced) SETERRQ(PetscObjectComm((PetscObject)pc),PETSC_ERR_PLIB,"BDDC Numbering of coarse dofs failed");
8249f34684f1SStefano Zampini   }
82508bec7fa6SStefano Zampini   /* ierr = PetscPrintf(PetscObjectComm((PetscObject)pc),"Size of coarse problem is %d\n",coarse_size);CHKERRQ(ierr); */
8251f34684f1SStefano Zampini   /* get back data */
8252f34684f1SStefano Zampini   *coarse_size_n = coarse_size;
8253f34684f1SStefano Zampini   *local_primal_indices_n = local_primal_indices;
8254674ae819SStefano Zampini   PetscFunctionReturn(0);
8255674ae819SStefano Zampini }
8256674ae819SStefano Zampini 
8257a7dc3881SStefano Zampini PetscErrorCode PCBDDCGlobalToLocal(VecScatter g2l_ctx,Vec gwork, Vec lwork, IS globalis, IS* localis)
8258e456f2a8SStefano Zampini {
8259e456f2a8SStefano Zampini   IS             localis_t;
8260a7dc3881SStefano Zampini   PetscInt       i,lsize,*idxs,n;
8261e456f2a8SStefano Zampini   PetscScalar    *vals;
8262e456f2a8SStefano Zampini   PetscErrorCode ierr;
8263e456f2a8SStefano Zampini 
8264e456f2a8SStefano Zampini   PetscFunctionBegin;
8265a7dc3881SStefano Zampini   /* get indices in local ordering exploiting local to global map */
8266e456f2a8SStefano Zampini   ierr = ISGetLocalSize(globalis,&lsize);CHKERRQ(ierr);
8267854ce69bSBarry Smith   ierr = PetscMalloc1(lsize,&vals);CHKERRQ(ierr);
8268e456f2a8SStefano Zampini   for (i=0;i<lsize;i++) vals[i] = 1.0;
8269e456f2a8SStefano Zampini   ierr = ISGetIndices(globalis,(const PetscInt**)&idxs);CHKERRQ(ierr);
8270a7dc3881SStefano Zampini   ierr = VecSet(gwork,0.0);CHKERRQ(ierr);
8271a7dc3881SStefano Zampini   ierr = VecSet(lwork,0.0);CHKERRQ(ierr);
82721035eff8SStefano Zampini   if (idxs) { /* multilevel guard */
8273a7dc3881SStefano Zampini     ierr = VecSetValues(gwork,lsize,idxs,vals,INSERT_VALUES);CHKERRQ(ierr);
82741035eff8SStefano Zampini   }
8275a7dc3881SStefano Zampini   ierr = VecAssemblyBegin(gwork);CHKERRQ(ierr);
8276e456f2a8SStefano Zampini   ierr = ISRestoreIndices(globalis,(const PetscInt**)&idxs);CHKERRQ(ierr);
8277e456f2a8SStefano Zampini   ierr = PetscFree(vals);CHKERRQ(ierr);
8278a7dc3881SStefano Zampini   ierr = VecAssemblyEnd(gwork);CHKERRQ(ierr);
8279a7dc3881SStefano Zampini   /* now compute set in local ordering */
8280a7dc3881SStefano Zampini   ierr = VecScatterBegin(g2l_ctx,gwork,lwork,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
8281a7dc3881SStefano Zampini   ierr = VecScatterEnd(g2l_ctx,gwork,lwork,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
8282a7dc3881SStefano Zampini   ierr = VecGetArrayRead(lwork,(const PetscScalar**)&vals);CHKERRQ(ierr);
8283a7dc3881SStefano Zampini   ierr = VecGetSize(lwork,&n);CHKERRQ(ierr);
8284a7dc3881SStefano Zampini   for (i=0,lsize=0;i<n;i++) {
8285ff92baa0SMatthew G. Knepley     if (PetscRealPart(vals[i]) > 0.5) {
8286e456f2a8SStefano Zampini       lsize++;
8287e456f2a8SStefano Zampini     }
8288e456f2a8SStefano Zampini   }
8289854ce69bSBarry Smith   ierr = PetscMalloc1(lsize,&idxs);CHKERRQ(ierr);
8290a7dc3881SStefano Zampini   for (i=0,lsize=0;i<n;i++) {
8291ff92baa0SMatthew G. Knepley     if (PetscRealPart(vals[i]) > 0.5) {
8292e456f2a8SStefano Zampini       idxs[lsize++] = i;
8293e456f2a8SStefano Zampini     }
8294e456f2a8SStefano Zampini   }
8295a7dc3881SStefano Zampini   ierr = VecRestoreArrayRead(lwork,(const PetscScalar**)&vals);CHKERRQ(ierr);
8296a7dc3881SStefano Zampini   ierr = ISCreateGeneral(PetscObjectComm((PetscObject)gwork),lsize,idxs,PETSC_OWN_POINTER,&localis_t);CHKERRQ(ierr);
8297e456f2a8SStefano Zampini   *localis = localis_t;
8298e456f2a8SStefano Zampini   PetscFunctionReturn(0);
8299e456f2a8SStefano Zampini }
8300906d46d4SStefano Zampini 
830108122e43SStefano Zampini PetscErrorCode PCBDDCSetUpSubSchurs(PC pc)
8302b96c3477SStefano Zampini {
8303a64f4aa4SStefano Zampini   PC_IS               *pcis=(PC_IS*)pc->data;
8304b96c3477SStefano Zampini   PC_BDDC             *pcbddc=(PC_BDDC*)pc->data;
8305b96c3477SStefano Zampini   PCBDDCSubSchurs     sub_schurs=pcbddc->sub_schurs;
8306a64f4aa4SStefano Zampini   Mat                 S_j;
8307b96c3477SStefano Zampini   PetscInt            *used_xadj,*used_adjncy;
8308b96c3477SStefano Zampini   PetscBool           free_used_adj;
8309b96c3477SStefano Zampini   PetscErrorCode      ierr;
8310b96c3477SStefano Zampini 
8311b96c3477SStefano Zampini   PetscFunctionBegin;
8312b96c3477SStefano Zampini   /* decide the adjacency to be used for determining internal problems for local schur on subsets */
8313b96c3477SStefano Zampini   free_used_adj = PETSC_FALSE;
831408122e43SStefano Zampini   if (pcbddc->sub_schurs_layers == -1) {
8315b96c3477SStefano Zampini     used_xadj = NULL;
8316b96c3477SStefano Zampini     used_adjncy = NULL;
8317b96c3477SStefano Zampini   } else {
831808122e43SStefano Zampini     if (pcbddc->sub_schurs_use_useradj && pcbddc->mat_graph->xadj) {
831908122e43SStefano Zampini       used_xadj = pcbddc->mat_graph->xadj;
832008122e43SStefano Zampini       used_adjncy = pcbddc->mat_graph->adjncy;
832108122e43SStefano Zampini     } else if (pcbddc->computed_rowadj) {
8322b96c3477SStefano Zampini       used_xadj = pcbddc->mat_graph->xadj;
8323b96c3477SStefano Zampini       used_adjncy = pcbddc->mat_graph->adjncy;
8324b96c3477SStefano Zampini     } else {
83252fffb893SStefano Zampini       PetscBool      flg_row=PETSC_FALSE;
8326b96c3477SStefano Zampini       const PetscInt *xadj,*adjncy;
8327b96c3477SStefano Zampini       PetscInt       nvtxs;
8328b96c3477SStefano Zampini 
83292fffb893SStefano Zampini       ierr = MatGetRowIJ(pcbddc->local_mat,0,PETSC_TRUE,PETSC_FALSE,&nvtxs,&xadj,&adjncy,&flg_row);CHKERRQ(ierr);
83302fffb893SStefano Zampini       if (flg_row) {
8331b96c3477SStefano Zampini         ierr = PetscMalloc2(nvtxs+1,&used_xadj,xadj[nvtxs],&used_adjncy);CHKERRQ(ierr);
8332b96c3477SStefano Zampini         ierr = PetscMemcpy(used_xadj,xadj,(nvtxs+1)*sizeof(*xadj));CHKERRQ(ierr);
8333b96c3477SStefano Zampini         ierr = PetscMemcpy(used_adjncy,adjncy,(xadj[nvtxs])*sizeof(*adjncy));CHKERRQ(ierr);
8334b96c3477SStefano Zampini         free_used_adj = PETSC_TRUE;
83352fffb893SStefano Zampini       } else {
83362fffb893SStefano Zampini         pcbddc->sub_schurs_layers = -1;
83372fffb893SStefano Zampini         used_xadj = NULL;
83382fffb893SStefano Zampini         used_adjncy = NULL;
83392fffb893SStefano Zampini       }
83402fffb893SStefano Zampini       ierr = MatRestoreRowIJ(pcbddc->local_mat,0,PETSC_TRUE,PETSC_FALSE,&nvtxs,&xadj,&adjncy,&flg_row);CHKERRQ(ierr);
8341b96c3477SStefano Zampini     }
8342b96c3477SStefano Zampini   }
8343d5574798SStefano Zampini 
8344d5574798SStefano Zampini   /* setup sub_schurs data */
8345a64f4aa4SStefano Zampini   ierr = MatCreateSchurComplement(pcis->A_II,pcis->A_II,pcis->A_IB,pcis->A_BI,pcis->A_BB,&S_j);CHKERRQ(ierr);
8346df4d28bfSStefano Zampini   if (!sub_schurs->schur_explicit) {
8347df4d28bfSStefano Zampini     /* pcbddc->ksp_D up to date only if not using MatFactor with Schur complement support */
8348a64f4aa4SStefano Zampini     ierr = MatSchurComplementSetKSP(S_j,pcbddc->ksp_D);CHKERRQ(ierr);
834991af6908SStefano Zampini     ierr = PCBDDCSubSchursSetUp(sub_schurs,NULL,S_j,PETSC_FALSE,used_xadj,used_adjncy,pcbddc->sub_schurs_layers,NULL,pcbddc->adaptive_selection,PETSC_FALSE,PETSC_FALSE,0,NULL,NULL,NULL,NULL);CHKERRQ(ierr);
8350a64f4aa4SStefano Zampini   } else {
835172b8c272SStefano Zampini     Mat       change = NULL;
83529d54b7f4SStefano Zampini     Vec       scaling = NULL;
8353111315fdSstefano_zampini     IS        change_primal = NULL, iP;
8354111315fdSstefano_zampini     PetscInt  benign_n;
8355111315fdSstefano_zampini     PetscBool reuse_solvers = (PetscBool)!pcbddc->use_change_of_basis;
8356111315fdSstefano_zampini     PetscBool isseqaij,need_change = PETSC_FALSE;
8357111315fdSstefano_zampini     PetscBool discrete_harmonic = PETSC_FALSE;
8358a3df083aSStefano Zampini 
83595feab87aSStefano Zampini     if (!pcbddc->use_vertices && reuse_solvers) {
83605feab87aSStefano Zampini       PetscInt n_vertices;
83615feab87aSStefano Zampini 
83625feab87aSStefano Zampini       ierr = ISGetLocalSize(sub_schurs->is_vertices,&n_vertices);CHKERRQ(ierr);
83632034aafcSStefano Zampini       reuse_solvers = (PetscBool)!n_vertices;
83645feab87aSStefano Zampini     }
836504708bb6SStefano Zampini     ierr = PetscObjectTypeCompare((PetscObject)pcbddc->local_mat,MATSEQAIJ,&isseqaij);CHKERRQ(ierr);
836604708bb6SStefano Zampini     if (!isseqaij) {
836704708bb6SStefano Zampini       Mat_IS* matis = (Mat_IS*)pc->pmat->data;
836804708bb6SStefano Zampini       if (matis->A == pcbddc->local_mat) {
836904708bb6SStefano Zampini         ierr = MatDestroy(&pcbddc->local_mat);CHKERRQ(ierr);
837004708bb6SStefano Zampini         ierr = MatConvert(matis->A,MATSEQAIJ,MAT_INITIAL_MATRIX,&pcbddc->local_mat);CHKERRQ(ierr);
837104708bb6SStefano Zampini       } else {
8372511c6705SHong Zhang         ierr = MatConvert(pcbddc->local_mat,MATSEQAIJ,MAT_INPLACE_MATRIX,&pcbddc->local_mat);CHKERRQ(ierr);
837304708bb6SStefano Zampini       }
837404708bb6SStefano Zampini     }
8375a3df083aSStefano Zampini     if (!pcbddc->benign_change_explicit) {
8376a3df083aSStefano Zampini       benign_n = pcbddc->benign_n;
8377ca92afb2SStefano Zampini     } else {
8378a3df083aSStefano Zampini       benign_n = 0;
8379ca92afb2SStefano Zampini     }
8380b7ab4a40SStefano Zampini     /* sub_schurs->change is a local object; instead, PCBDDCConstraintsSetUp and the quantities used in the test below are logically collective on pc.
8381b7ab4a40SStefano Zampini        We need a global reduction to avoid possible deadlocks.
8382b7ab4a40SStefano Zampini        We assume that sub_schurs->change is created once, and then reused for different solves, unless the topography has been recomputed */
838372b8c272SStefano Zampini     if (pcbddc->adaptive_userdefined || (pcbddc->deluxe_zerorows && !pcbddc->use_change_of_basis)) {
838422db5ddcSStefano Zampini       PetscBool have_loc_change = (PetscBool)(!!sub_schurs->change);
8385b7ab4a40SStefano Zampini       ierr = MPIU_Allreduce(&have_loc_change,&need_change,1,MPIU_BOOL,MPI_LOR,PetscObjectComm((PetscObject)pc));CHKERRQ(ierr);
838622db5ddcSStefano Zampini       need_change = (PetscBool)(!need_change);
8387b7ab4a40SStefano Zampini     }
8388b7ab4a40SStefano Zampini     /* If the user defines additional constraints, we import them here.
8389b7ab4a40SStefano Zampini        We need to compute the change of basis according to the quadrature weights attached to pmat via MatSetNearNullSpace, and this could not be done (at the moment) without some hacking */
8390b7ab4a40SStefano Zampini     if (need_change) {
839188c03ad3SStefano Zampini       PC_IS   *pcisf;
839288c03ad3SStefano Zampini       PC_BDDC *pcbddcf;
839388c03ad3SStefano Zampini       PC      pcf;
839488c03ad3SStefano Zampini 
8395e4d548c7SStefano Zampini       if (pcbddc->sub_schurs_rebuild) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"Cannot compute change of basis with a different graph");
839688c03ad3SStefano Zampini       ierr = PCCreate(PetscObjectComm((PetscObject)pc),&pcf);CHKERRQ(ierr);
839788c03ad3SStefano Zampini       ierr = PCSetOperators(pcf,pc->mat,pc->pmat);CHKERRQ(ierr);
839888c03ad3SStefano Zampini       ierr = PCSetType(pcf,PCBDDC);CHKERRQ(ierr);
8399b9be95fcSstefano_zampini 
840088c03ad3SStefano Zampini       /* hacks */
840188c03ad3SStefano Zampini       pcisf                        = (PC_IS*)pcf->data;
840272b8c272SStefano Zampini       pcisf->is_B_local            = pcis->is_B_local;
840372b8c272SStefano Zampini       pcisf->vec1_N                = pcis->vec1_N;
840472b8c272SStefano Zampini       pcisf->BtoNmap               = pcis->BtoNmap;
840572b8c272SStefano Zampini       pcisf->n                     = pcis->n;
840672b8c272SStefano Zampini       pcisf->n_B                   = pcis->n_B;
840788c03ad3SStefano Zampini       pcbddcf                      = (PC_BDDC*)pcf->data;
840888c03ad3SStefano Zampini       ierr                         = PetscFree(pcbddcf->mat_graph);CHKERRQ(ierr);
840988c03ad3SStefano Zampini       pcbddcf->mat_graph           = pcbddc->mat_graph;
841088c03ad3SStefano Zampini       pcbddcf->use_faces           = PETSC_TRUE;
841188c03ad3SStefano Zampini       pcbddcf->use_change_of_basis = PETSC_TRUE;
841288c03ad3SStefano Zampini       pcbddcf->use_change_on_faces = PETSC_TRUE;
841372b8c272SStefano Zampini       pcbddcf->use_qr_single       = PETSC_TRUE;
841488c03ad3SStefano Zampini       pcbddcf->fake_change         = PETSC_TRUE;
8415b9be95fcSstefano_zampini 
8416b9be95fcSstefano_zampini       /* setup constraints so that we can get information on primal vertices and change of basis (in local numbering) */
841788c03ad3SStefano Zampini       ierr = PCBDDCConstraintsSetUp(pcf);CHKERRQ(ierr);
841872b8c272SStefano Zampini       sub_schurs->change_with_qr = pcbddcf->use_qr_single;
841972b8c272SStefano Zampini       ierr = ISCreateGeneral(PETSC_COMM_SELF,pcbddcf->n_vertices,pcbddcf->local_primal_ref_node,PETSC_COPY_VALUES,&change_primal);CHKERRQ(ierr);
842072b8c272SStefano Zampini       change = pcbddcf->ConstraintMatrix;
842172b8c272SStefano Zampini       pcbddcf->ConstraintMatrix = NULL;
8422b9be95fcSstefano_zampini 
842388c03ad3SStefano Zampini       /* free unneeded memory allocated in PCBDDCConstraintsSetUp */
842472b8c272SStefano Zampini       ierr = PetscFree(pcbddcf->sub_schurs);CHKERRQ(ierr);
842588c03ad3SStefano Zampini       ierr = MatNullSpaceDestroy(&pcbddcf->onearnullspace);CHKERRQ(ierr);
842688c03ad3SStefano Zampini       ierr = PetscFree2(pcbddcf->local_primal_ref_node,pcbddcf->local_primal_ref_mult);CHKERRQ(ierr);
842788c03ad3SStefano Zampini       ierr = PetscFree(pcbddcf->primal_indices_local_idxs);CHKERRQ(ierr);
842888c03ad3SStefano Zampini       ierr = PetscFree(pcbddcf->onearnullvecs_state);CHKERRQ(ierr);
842988c03ad3SStefano Zampini       ierr = PetscFree(pcf->data);CHKERRQ(ierr);
843088c03ad3SStefano Zampini       pcf->ops->destroy = NULL;
8431b9be95fcSstefano_zampini       pcf->ops->reset   = NULL;
843288c03ad3SStefano Zampini       ierr = PCDestroy(&pcf);CHKERRQ(ierr);
843388c03ad3SStefano Zampini     }
84349d54b7f4SStefano Zampini     if (!pcbddc->use_deluxe_scaling) scaling = pcis->D;
8435111315fdSstefano_zampini 
8436111315fdSstefano_zampini     ierr = PetscObjectQuery((PetscObject)pc,"__KSPFETIDP_iP",(PetscObject*)&iP);CHKERRQ(ierr);
8437111315fdSstefano_zampini     if (iP) {
8438111315fdSstefano_zampini       ierr = PetscOptionsBegin(PetscObjectComm((PetscObject)iP),sub_schurs->prefix,"BDDC sub_schurs options","PC");CHKERRQ(ierr);
8439111315fdSstefano_zampini       ierr = PetscOptionsBool("-sub_schurs_discrete_harmonic",NULL,NULL,discrete_harmonic,&discrete_harmonic,NULL);CHKERRQ(ierr);
8440111315fdSstefano_zampini       ierr = PetscOptionsEnd();CHKERRQ(ierr);
8441111315fdSstefano_zampini     }
8442111315fdSstefano_zampini     if (discrete_harmonic) {
8443111315fdSstefano_zampini       Mat A;
8444111315fdSstefano_zampini       ierr = MatDuplicate(pcbddc->local_mat,MAT_COPY_VALUES,&A);CHKERRQ(ierr);
8445111315fdSstefano_zampini       ierr = MatZeroRowsColumnsIS(A,iP,1.0,NULL,NULL);CHKERRQ(ierr);
8446111315fdSstefano_zampini       ierr = PetscObjectCompose((PetscObject)A,"__KSPFETIDP_iP",(PetscObject)iP);CHKERRQ(ierr);
8447111315fdSstefano_zampini       ierr = PCBDDCSubSchursSetUp(sub_schurs,A,S_j,pcbddc->sub_schurs_exact_schur,used_xadj,used_adjncy,pcbddc->sub_schurs_layers,scaling,pcbddc->adaptive_selection,reuse_solvers,pcbddc->benign_saddle_point,benign_n,pcbddc->benign_p0_lidx,pcbddc->benign_zerodiag_subs,change,change_primal);CHKERRQ(ierr);
8448111315fdSstefano_zampini       ierr = MatDestroy(&A);CHKERRQ(ierr);
8449111315fdSstefano_zampini     } else {
845091af6908SStefano Zampini       ierr = PCBDDCSubSchursSetUp(sub_schurs,pcbddc->local_mat,S_j,pcbddc->sub_schurs_exact_schur,used_xadj,used_adjncy,pcbddc->sub_schurs_layers,scaling,pcbddc->adaptive_selection,reuse_solvers,pcbddc->benign_saddle_point,benign_n,pcbddc->benign_p0_lidx,pcbddc->benign_zerodiag_subs,change,change_primal);CHKERRQ(ierr);
8451111315fdSstefano_zampini     }
845272b8c272SStefano Zampini     ierr = MatDestroy(&change);CHKERRQ(ierr);
845372b8c272SStefano Zampini     ierr = ISDestroy(&change_primal);CHKERRQ(ierr);
8454ca92afb2SStefano Zampini   }
8455d12d3064SStefano Zampini   ierr = MatDestroy(&S_j);CHKERRQ(ierr);
8456b96c3477SStefano Zampini 
8457b96c3477SStefano Zampini   /* free adjacency */
8458b96c3477SStefano Zampini   if (free_used_adj) {
8459b96c3477SStefano Zampini     ierr = PetscFree2(used_xadj,used_adjncy);CHKERRQ(ierr);
8460b96c3477SStefano Zampini   }
8461b96c3477SStefano Zampini   PetscFunctionReturn(0);
8462b96c3477SStefano Zampini }
8463b96c3477SStefano Zampini 
846408122e43SStefano Zampini PetscErrorCode PCBDDCInitSubSchurs(PC pc)
8465b96c3477SStefano Zampini {
8466b96c3477SStefano Zampini   PC_IS               *pcis=(PC_IS*)pc->data;
8467b96c3477SStefano Zampini   PC_BDDC             *pcbddc=(PC_BDDC*)pc->data;
8468b96c3477SStefano Zampini   PCBDDCGraph         graph;
8469b96c3477SStefano Zampini   PetscErrorCode      ierr;
8470b96c3477SStefano Zampini 
8471b96c3477SStefano Zampini   PetscFunctionBegin;
8472b96c3477SStefano Zampini   /* attach interface graph for determining subsets */
847308122e43SStefano Zampini   if (pcbddc->sub_schurs_rebuild) { /* in case rebuild has been requested, it uses a graph generated only by the neighbouring information */
84743301b35fSStefano Zampini     IS       verticesIS,verticescomm;
84753301b35fSStefano Zampini     PetscInt vsize,*idxs;
8476b96c3477SStefano Zampini 
8477b96c3477SStefano Zampini     ierr = PCBDDCGraphGetCandidatesIS(pcbddc->mat_graph,NULL,NULL,NULL,NULL,&verticesIS);CHKERRQ(ierr);
84783301b35fSStefano Zampini     ierr = ISGetSize(verticesIS,&vsize);CHKERRQ(ierr);
84793301b35fSStefano Zampini     ierr = ISGetIndices(verticesIS,(const PetscInt**)&idxs);CHKERRQ(ierr);
84803301b35fSStefano Zampini     ierr = ISCreateGeneral(PetscObjectComm((PetscObject)pc),vsize,idxs,PETSC_COPY_VALUES,&verticescomm);CHKERRQ(ierr);
84813301b35fSStefano Zampini     ierr = ISRestoreIndices(verticesIS,(const PetscInt**)&idxs);CHKERRQ(ierr);
8482c8272957SStefano Zampini     ierr = PCBDDCGraphRestoreCandidatesIS(pcbddc->mat_graph,NULL,NULL,NULL,NULL,&verticesIS);CHKERRQ(ierr);
8483b96c3477SStefano Zampini     ierr = PCBDDCGraphCreate(&graph);CHKERRQ(ierr);
8484be12c134Sstefano_zampini     ierr = PCBDDCGraphInit(graph,pcbddc->mat_graph->l2gmap,pcbddc->mat_graph->nvtxs_global,pcbddc->graphmaxcount);CHKERRQ(ierr);
8485441e0de0SStefano Zampini     ierr = PCBDDCGraphSetUp(graph,pcbddc->mat_graph->custom_minimal_size,NULL,pcbddc->DirichletBoundariesLocal,0,NULL,verticescomm);CHKERRQ(ierr);
84863301b35fSStefano Zampini     ierr = ISDestroy(&verticescomm);CHKERRQ(ierr);
8487b96c3477SStefano Zampini     ierr = PCBDDCGraphComputeConnectedComponents(graph);CHKERRQ(ierr);
8488b96c3477SStefano Zampini   } else {
8489b96c3477SStefano Zampini     graph = pcbddc->mat_graph;
8490b96c3477SStefano Zampini   }
8491e4d548c7SStefano Zampini   /* print some info */
84925c643e28SStefano Zampini   if (pcbddc->dbg_flag && !pcbddc->sub_schurs_rebuild) {
8493e4d548c7SStefano Zampini     IS       vertices;
8494e4d548c7SStefano Zampini     PetscInt nv,nedges,nfaces;
8495c8272957SStefano Zampini     ierr = PCBDDCGraphASCIIView(graph,pcbddc->dbg_flag,pcbddc->dbg_viewer);CHKERRQ(ierr);
8496e4d548c7SStefano Zampini     ierr = PCBDDCGraphGetCandidatesIS(graph,&nfaces,NULL,&nedges,NULL,&vertices);CHKERRQ(ierr);
8497e4d548c7SStefano Zampini     ierr = ISGetSize(vertices,&nv);CHKERRQ(ierr);
8498e4d548c7SStefano Zampini     ierr = PetscViewerASCIIPushSynchronized(pcbddc->dbg_viewer);CHKERRQ(ierr);
8499e4d548c7SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"--------------------------------------------------------------\n");CHKERRQ(ierr);
8500e4d548c7SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"Subdomain %04d got %02d local candidate vertices (%d)\n",PetscGlobalRank,nv,pcbddc->use_vertices);CHKERRQ(ierr);
8501e4d548c7SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"Subdomain %04d got %02d local candidate edges    (%d)\n",PetscGlobalRank,nedges,pcbddc->use_edges);CHKERRQ(ierr);
8502e4d548c7SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"Subdomain %04d got %02d local candidate faces    (%d)\n",PetscGlobalRank,nfaces,pcbddc->use_faces);CHKERRQ(ierr);
8503e4d548c7SStefano Zampini     ierr = PetscViewerFlush(pcbddc->dbg_viewer);CHKERRQ(ierr);
8504e4d548c7SStefano Zampini     ierr = PetscViewerASCIIPopSynchronized(pcbddc->dbg_viewer);CHKERRQ(ierr);
8505c8272957SStefano Zampini     ierr = PCBDDCGraphRestoreCandidatesIS(graph,&nfaces,NULL,&nedges,NULL,&vertices);CHKERRQ(ierr);
8506e4d548c7SStefano Zampini   }
8507b96c3477SStefano Zampini 
8508b96c3477SStefano Zampini   /* sub_schurs init */
8509b334f244SStefano Zampini   if (!pcbddc->sub_schurs) {
8510b334f244SStefano Zampini     ierr = PCBDDCSubSchursCreate(&pcbddc->sub_schurs);CHKERRQ(ierr);
8511b334f244SStefano Zampini   }
85128b6046baSStefano Zampini   ierr = PCBDDCSubSchursInit(pcbddc->sub_schurs,pcis->is_I_local,pcis->is_B_local,graph,pcis->BtoNmap,pcbddc->sub_schurs_rebuild);CHKERRQ(ierr);
8513e62b6521Sstefano_zampini   pcbddc->sub_schurs->prefix = ((PetscObject)pc)->prefix;
8514a64f4aa4SStefano Zampini 
8515b96c3477SStefano Zampini   /* free graph struct */
851608122e43SStefano Zampini   if (pcbddc->sub_schurs_rebuild) {
8517b96c3477SStefano Zampini     ierr = PCBDDCGraphDestroy(&graph);CHKERRQ(ierr);
8518b96c3477SStefano Zampini   }
8519b96c3477SStefano Zampini   PetscFunctionReturn(0);
8520b96c3477SStefano Zampini }
8521fa34dd3eSStefano Zampini 
8522fa34dd3eSStefano Zampini PetscErrorCode PCBDDCCheckOperator(PC pc)
8523fa34dd3eSStefano Zampini {
8524fa34dd3eSStefano Zampini   PC_IS               *pcis=(PC_IS*)pc->data;
8525fa34dd3eSStefano Zampini   PC_BDDC             *pcbddc=(PC_BDDC*)pc->data;
8526fa34dd3eSStefano Zampini   PetscErrorCode      ierr;
8527fa34dd3eSStefano Zampini 
8528fa34dd3eSStefano Zampini   PetscFunctionBegin;
8529fa34dd3eSStefano Zampini   if (pcbddc->n_vertices == pcbddc->local_primal_size) {
8530fa34dd3eSStefano Zampini     IS             zerodiag = NULL;
85314f1b2e48SStefano Zampini     Mat            S_j,B0_B=NULL;
8532fa34dd3eSStefano Zampini     Vec            dummy_vec=NULL,vec_check_B,vec_scale_P;
85334f1b2e48SStefano Zampini     PetscScalar    *p0_check,*array,*array2;
853475c01103SStefano Zampini     PetscReal      norm;
8535fa34dd3eSStefano Zampini     PetscInt       i;
8536fa34dd3eSStefano Zampini 
8537fa34dd3eSStefano Zampini     /* B0 and B0_B */
8538fa34dd3eSStefano Zampini     if (zerodiag) {
8539fa34dd3eSStefano Zampini       IS       dummy;
8540fa34dd3eSStefano Zampini 
85414f1b2e48SStefano Zampini       ierr = ISCreateStride(PETSC_COMM_SELF,pcbddc->benign_n,0,1,&dummy);CHKERRQ(ierr);
85427dae84e0SHong Zhang       ierr = MatCreateSubMatrix(pcbddc->benign_B0,dummy,pcis->is_B_local,MAT_INITIAL_MATRIX,&B0_B);CHKERRQ(ierr);
8543fa34dd3eSStefano Zampini       ierr = MatCreateVecs(B0_B,NULL,&dummy_vec);CHKERRQ(ierr);
8544fa34dd3eSStefano Zampini       ierr = ISDestroy(&dummy);CHKERRQ(ierr);
8545fa34dd3eSStefano Zampini     }
8546fa34dd3eSStefano Zampini     /* I need a primal vector to scale primal nodes since BDDC sums contibutions */
8547fa34dd3eSStefano Zampini     ierr = VecDuplicate(pcbddc->vec1_P,&vec_scale_P);CHKERRQ(ierr);
8548fa34dd3eSStefano Zampini     ierr = VecSet(pcbddc->vec1_P,1.0);CHKERRQ(ierr);
8549fa34dd3eSStefano Zampini     ierr = VecScatterBegin(pcbddc->coarse_loc_to_glob,pcbddc->vec1_P,pcbddc->coarse_vec,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
8550fa34dd3eSStefano Zampini     ierr = VecScatterEnd(pcbddc->coarse_loc_to_glob,pcbddc->vec1_P,pcbddc->coarse_vec,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
8551fa34dd3eSStefano Zampini     ierr = VecScatterBegin(pcbddc->coarse_loc_to_glob,pcbddc->coarse_vec,vec_scale_P,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
8552fa34dd3eSStefano Zampini     ierr = VecScatterEnd(pcbddc->coarse_loc_to_glob,pcbddc->coarse_vec,vec_scale_P,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
8553fa34dd3eSStefano Zampini     ierr = VecReciprocal(vec_scale_P);CHKERRQ(ierr);
8554fa34dd3eSStefano Zampini     /* S_j */
8555fa34dd3eSStefano Zampini     ierr = MatCreateSchurComplement(pcis->A_II,pcis->A_II,pcis->A_IB,pcis->A_BI,pcis->A_BB,&S_j);CHKERRQ(ierr);
8556fa34dd3eSStefano Zampini     ierr = MatSchurComplementSetKSP(S_j,pcbddc->ksp_D);CHKERRQ(ierr);
8557fa34dd3eSStefano Zampini 
8558fa34dd3eSStefano Zampini     /* mimic vector in \widetilde{W}_\Gamma */
8559fa34dd3eSStefano Zampini     ierr = VecSetRandom(pcis->vec1_N,NULL);CHKERRQ(ierr);
8560fa34dd3eSStefano Zampini     /* continuous in primal space */
8561fa34dd3eSStefano Zampini     ierr = VecSetRandom(pcbddc->coarse_vec,NULL);CHKERRQ(ierr);
8562fa34dd3eSStefano Zampini     ierr = VecScatterBegin(pcbddc->coarse_loc_to_glob,pcbddc->coarse_vec,pcbddc->vec1_P,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
8563fa34dd3eSStefano Zampini     ierr = VecScatterEnd(pcbddc->coarse_loc_to_glob,pcbddc->coarse_vec,pcbddc->vec1_P,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
8564fa34dd3eSStefano Zampini     ierr = VecGetArray(pcbddc->vec1_P,&array);CHKERRQ(ierr);
85654f1b2e48SStefano Zampini     ierr = PetscCalloc1(pcbddc->benign_n,&p0_check);CHKERRQ(ierr);
85664f1b2e48SStefano Zampini     for (i=0;i<pcbddc->benign_n;i++) p0_check[i] = array[pcbddc->local_primal_size-pcbddc->benign_n+i];
8567fa34dd3eSStefano Zampini     ierr = VecSetValues(pcis->vec1_N,pcbddc->local_primal_size,pcbddc->local_primal_ref_node,array,INSERT_VALUES);CHKERRQ(ierr);
8568fa34dd3eSStefano Zampini     ierr = VecRestoreArray(pcbddc->vec1_P,&array);CHKERRQ(ierr);
8569fa34dd3eSStefano Zampini     ierr = VecAssemblyBegin(pcis->vec1_N);CHKERRQ(ierr);
8570fa34dd3eSStefano Zampini     ierr = VecAssemblyEnd(pcis->vec1_N);CHKERRQ(ierr);
8571fa34dd3eSStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec2_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
8572fa34dd3eSStefano Zampini     ierr = VecScatterEnd(pcis->N_to_B,pcis->vec1_N,pcis->vec2_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
8573fa34dd3eSStefano Zampini     ierr = VecDuplicate(pcis->vec2_B,&vec_check_B);CHKERRQ(ierr);
8574fa34dd3eSStefano Zampini     ierr = VecCopy(pcis->vec2_B,vec_check_B);CHKERRQ(ierr);
8575fa34dd3eSStefano Zampini 
8576fa34dd3eSStefano Zampini     /* assemble rhs for coarse problem */
8577fa34dd3eSStefano Zampini     /* widetilde{S}_\Gamma w_\Gamma + \widetilde{B0}^T_B p0 */
8578fa34dd3eSStefano Zampini     /* local with Schur */
8579fa34dd3eSStefano Zampini     ierr = MatMult(S_j,pcis->vec2_B,pcis->vec1_B);CHKERRQ(ierr);
8580fa34dd3eSStefano Zampini     if (zerodiag) {
8581fa34dd3eSStefano Zampini       ierr = VecGetArray(dummy_vec,&array);CHKERRQ(ierr);
85824f1b2e48SStefano Zampini       for (i=0;i<pcbddc->benign_n;i++) array[i] = p0_check[i];
8583fa34dd3eSStefano Zampini       ierr = VecRestoreArray(dummy_vec,&array);CHKERRQ(ierr);
8584fa34dd3eSStefano Zampini       ierr = MatMultTransposeAdd(B0_B,dummy_vec,pcis->vec1_B,pcis->vec1_B);CHKERRQ(ierr);
8585fa34dd3eSStefano Zampini     }
8586fa34dd3eSStefano Zampini     /* sum on primal nodes the local contributions */
8587fa34dd3eSStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_B,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
8588fa34dd3eSStefano Zampini     ierr = VecScatterEnd(pcis->N_to_B,pcis->vec1_B,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
8589fa34dd3eSStefano Zampini     ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
8590fa34dd3eSStefano Zampini     ierr = VecGetArray(pcbddc->vec1_P,&array2);CHKERRQ(ierr);
8591fa34dd3eSStefano Zampini     for (i=0;i<pcbddc->local_primal_size;i++) array2[i] = array[pcbddc->local_primal_ref_node[i]];
8592fa34dd3eSStefano Zampini     ierr = VecRestoreArray(pcbddc->vec1_P,&array2);CHKERRQ(ierr);
8593fa34dd3eSStefano Zampini     ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
8594fa34dd3eSStefano Zampini     ierr = VecSet(pcbddc->coarse_vec,0.);CHKERRQ(ierr);
8595fa34dd3eSStefano Zampini     ierr = VecScatterBegin(pcbddc->coarse_loc_to_glob,pcbddc->vec1_P,pcbddc->coarse_vec,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
8596fa34dd3eSStefano Zampini     ierr = VecScatterEnd(pcbddc->coarse_loc_to_glob,pcbddc->vec1_P,pcbddc->coarse_vec,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
8597fa34dd3eSStefano Zampini     ierr = VecScatterBegin(pcbddc->coarse_loc_to_glob,pcbddc->coarse_vec,pcbddc->vec1_P,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
8598fa34dd3eSStefano Zampini     ierr = VecScatterEnd(pcbddc->coarse_loc_to_glob,pcbddc->coarse_vec,pcbddc->vec1_P,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
8599fa34dd3eSStefano Zampini     ierr = VecGetArray(pcbddc->vec1_P,&array);CHKERRQ(ierr);
8600fa34dd3eSStefano Zampini     /* scale primal nodes (BDDC sums contibutions) */
8601fa34dd3eSStefano Zampini     ierr = VecPointwiseMult(pcbddc->vec1_P,vec_scale_P,pcbddc->vec1_P);CHKERRQ(ierr);
8602fa34dd3eSStefano Zampini     ierr = VecSetValues(pcis->vec1_N,pcbddc->local_primal_size,pcbddc->local_primal_ref_node,array,INSERT_VALUES);CHKERRQ(ierr);
8603fa34dd3eSStefano Zampini     ierr = VecRestoreArray(pcbddc->vec1_P,&array);CHKERRQ(ierr);
8604fa34dd3eSStefano Zampini     ierr = VecAssemblyBegin(pcis->vec1_N);CHKERRQ(ierr);
8605fa34dd3eSStefano Zampini     ierr = VecAssemblyEnd(pcis->vec1_N);CHKERRQ(ierr);
8606fa34dd3eSStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
8607fa34dd3eSStefano Zampini     ierr = VecScatterEnd(pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
8608fa34dd3eSStefano Zampini     /* global: \widetilde{B0}_B w_\Gamma */
8609fa34dd3eSStefano Zampini     if (zerodiag) {
8610fa34dd3eSStefano Zampini       ierr = MatMult(B0_B,pcis->vec2_B,dummy_vec);CHKERRQ(ierr);
8611fa34dd3eSStefano Zampini       ierr = VecGetArray(dummy_vec,&array);CHKERRQ(ierr);
86124f1b2e48SStefano Zampini       for (i=0;i<pcbddc->benign_n;i++) pcbddc->benign_p0[i] = array[i];
8613fa34dd3eSStefano Zampini       ierr = VecRestoreArray(dummy_vec,&array);CHKERRQ(ierr);
8614fa34dd3eSStefano Zampini     }
8615fa34dd3eSStefano Zampini     /* BDDC */
8616fa34dd3eSStefano Zampini     ierr = VecSet(pcis->vec1_D,0.);CHKERRQ(ierr);
8617fa34dd3eSStefano Zampini     ierr = PCBDDCApplyInterfacePreconditioner(pc,PETSC_FALSE);CHKERRQ(ierr);
8618fa34dd3eSStefano Zampini 
8619fa34dd3eSStefano Zampini     ierr = VecCopy(pcis->vec1_B,pcis->vec2_B);CHKERRQ(ierr);
8620fa34dd3eSStefano Zampini     ierr = VecAXPY(pcis->vec1_B,-1.0,vec_check_B);CHKERRQ(ierr);
8621fa34dd3eSStefano Zampini     ierr = VecNorm(pcis->vec1_B,NORM_INFINITY,&norm);CHKERRQ(ierr);
8622fa34dd3eSStefano Zampini     PetscPrintf(PETSC_COMM_SELF,"[%d] BDDC local error is %1.4e\n",PetscGlobalRank,norm);
86234f1b2e48SStefano Zampini     for (i=0;i<pcbddc->benign_n;i++) {
86244f1b2e48SStefano Zampini       PetscPrintf(PETSC_COMM_SELF,"[%d] BDDC p0[%d] error is %1.4e\n",PetscGlobalRank,i,PetscAbsScalar(pcbddc->benign_p0[i]-p0_check[i]));
8625fa34dd3eSStefano Zampini     }
86264f1b2e48SStefano Zampini     ierr = PetscFree(p0_check);CHKERRQ(ierr);
8627fa34dd3eSStefano Zampini     ierr = VecDestroy(&vec_scale_P);CHKERRQ(ierr);
8628fa34dd3eSStefano Zampini     ierr = VecDestroy(&vec_check_B);CHKERRQ(ierr);
8629fa34dd3eSStefano Zampini     ierr = VecDestroy(&dummy_vec);CHKERRQ(ierr);
8630fa34dd3eSStefano Zampini     ierr = MatDestroy(&S_j);CHKERRQ(ierr);
8631fa34dd3eSStefano Zampini     ierr = MatDestroy(&B0_B);CHKERRQ(ierr);
8632fa34dd3eSStefano Zampini   }
8633fa34dd3eSStefano Zampini   PetscFunctionReturn(0);
8634fa34dd3eSStefano Zampini }
86351e0482f5SStefano Zampini 
86361e0482f5SStefano Zampini #include <../src/mat/impls/aij/mpi/mpiaij.h>
86371e0482f5SStefano Zampini PetscErrorCode MatMPIAIJRestrict(Mat A, MPI_Comm ccomm, Mat *B)
86381e0482f5SStefano Zampini {
86391e0482f5SStefano Zampini   Mat            At;
86401e0482f5SStefano Zampini   IS             rows;
86411e0482f5SStefano Zampini   PetscInt       rst,ren;
86421e0482f5SStefano Zampini   PetscErrorCode ierr;
86431e0482f5SStefano Zampini   PetscLayout    rmap;
86441e0482f5SStefano Zampini 
86451e0482f5SStefano Zampini   PetscFunctionBegin;
86461e0482f5SStefano Zampini   rst = ren = 0;
86471e0482f5SStefano Zampini   if (ccomm != MPI_COMM_NULL) {
86481e0482f5SStefano Zampini     ierr = PetscLayoutCreate(ccomm,&rmap);CHKERRQ(ierr);
86491e0482f5SStefano Zampini     ierr = PetscLayoutSetSize(rmap,A->rmap->N);CHKERRQ(ierr);
86501e0482f5SStefano Zampini     ierr = PetscLayoutSetBlockSize(rmap,1);CHKERRQ(ierr);
86511e0482f5SStefano Zampini     ierr = PetscLayoutSetUp(rmap);CHKERRQ(ierr);
86521e0482f5SStefano Zampini     ierr = PetscLayoutGetRange(rmap,&rst,&ren);CHKERRQ(ierr);
86531e0482f5SStefano Zampini   }
8654e07686f2SStefano Zampini   ierr = ISCreateStride(PetscObjectComm((PetscObject)A),ren-rst,rst,1,&rows);CHKERRQ(ierr);
86557dae84e0SHong Zhang   ierr = MatCreateSubMatrix(A,rows,NULL,MAT_INITIAL_MATRIX,&At);CHKERRQ(ierr);
86561e0482f5SStefano Zampini   ierr = ISDestroy(&rows);CHKERRQ(ierr);
86571e0482f5SStefano Zampini 
86581e0482f5SStefano Zampini   if (ccomm != MPI_COMM_NULL) {
86591e0482f5SStefano Zampini     Mat_MPIAIJ *a,*b;
86601e0482f5SStefano Zampini     IS         from,to;
86611e0482f5SStefano Zampini     Vec        gvec;
86621e0482f5SStefano Zampini     PetscInt   lsize;
86631e0482f5SStefano Zampini 
86641e0482f5SStefano Zampini     ierr = MatCreate(ccomm,B);CHKERRQ(ierr);
86651e0482f5SStefano Zampini     ierr = MatSetSizes(*B,ren-rst,PETSC_DECIDE,PETSC_DECIDE,At->cmap->N);CHKERRQ(ierr);
86661e0482f5SStefano Zampini     ierr = MatSetType(*B,MATAIJ);CHKERRQ(ierr);
86671e0482f5SStefano Zampini     ierr = PetscLayoutDestroy(&((*B)->rmap));CHKERRQ(ierr);
86681e0482f5SStefano Zampini     ierr = PetscLayoutSetUp((*B)->cmap);CHKERRQ(ierr);
86691e0482f5SStefano Zampini     a    = (Mat_MPIAIJ*)At->data;
86701e0482f5SStefano Zampini     b    = (Mat_MPIAIJ*)(*B)->data;
86711e0482f5SStefano Zampini     ierr = MPI_Comm_size(ccomm,&b->size);CHKERRQ(ierr);
86721e0482f5SStefano Zampini     ierr = MPI_Comm_rank(ccomm,&b->rank);CHKERRQ(ierr);
86731e0482f5SStefano Zampini     ierr = PetscObjectReference((PetscObject)a->A);CHKERRQ(ierr);
86741e0482f5SStefano Zampini     ierr = PetscObjectReference((PetscObject)a->B);CHKERRQ(ierr);
86751e0482f5SStefano Zampini     b->A = a->A;
86761e0482f5SStefano Zampini     b->B = a->B;
86771e0482f5SStefano Zampini 
86781e0482f5SStefano Zampini     b->donotstash      = a->donotstash;
86791e0482f5SStefano Zampini     b->roworiented     = a->roworiented;
86801e0482f5SStefano Zampini     b->rowindices      = 0;
86811e0482f5SStefano Zampini     b->rowvalues       = 0;
86821e0482f5SStefano Zampini     b->getrowactive    = PETSC_FALSE;
86831e0482f5SStefano Zampini 
86841e0482f5SStefano Zampini     (*B)->rmap         = rmap;
86851e0482f5SStefano Zampini     (*B)->factortype   = A->factortype;
86861e0482f5SStefano Zampini     (*B)->assembled    = PETSC_TRUE;
86871e0482f5SStefano Zampini     (*B)->insertmode   = NOT_SET_VALUES;
86881e0482f5SStefano Zampini     (*B)->preallocated = PETSC_TRUE;
86891e0482f5SStefano Zampini 
86901e0482f5SStefano Zampini     if (a->colmap) {
86911e0482f5SStefano Zampini #if defined(PETSC_USE_CTABLE)
86921e0482f5SStefano Zampini       ierr = PetscTableCreateCopy(a->colmap,&b->colmap);CHKERRQ(ierr);
86931e0482f5SStefano Zampini #else
86941e0482f5SStefano Zampini       ierr = PetscMalloc1(At->cmap->N,&b->colmap);CHKERRQ(ierr);
86951e0482f5SStefano Zampini       ierr = PetscLogObjectMemory((PetscObject)*B,At->cmap->N*sizeof(PetscInt));CHKERRQ(ierr);
86961e0482f5SStefano Zampini       ierr = PetscMemcpy(b->colmap,a->colmap,At->cmap->N*sizeof(PetscInt));CHKERRQ(ierr);
86971e0482f5SStefano Zampini #endif
86981e0482f5SStefano Zampini     } else b->colmap = 0;
86991e0482f5SStefano Zampini     if (a->garray) {
87001e0482f5SStefano Zampini       PetscInt len;
87011e0482f5SStefano Zampini       len  = a->B->cmap->n;
87021e0482f5SStefano Zampini       ierr = PetscMalloc1(len+1,&b->garray);CHKERRQ(ierr);
87031e0482f5SStefano Zampini       ierr = PetscLogObjectMemory((PetscObject)(*B),len*sizeof(PetscInt));CHKERRQ(ierr);
87041e0482f5SStefano Zampini       if (len) { ierr = PetscMemcpy(b->garray,a->garray,len*sizeof(PetscInt));CHKERRQ(ierr); }
87051e0482f5SStefano Zampini     } else b->garray = 0;
87061e0482f5SStefano Zampini 
87071e0482f5SStefano Zampini     ierr    = PetscObjectReference((PetscObject)a->lvec);CHKERRQ(ierr);
87081e0482f5SStefano Zampini     b->lvec = a->lvec;
87091e0482f5SStefano Zampini     ierr    = PetscLogObjectParent((PetscObject)*B,(PetscObject)b->lvec);CHKERRQ(ierr);
87101e0482f5SStefano Zampini 
87111e0482f5SStefano Zampini     /* cannot use VecScatterCopy */
87121e0482f5SStefano Zampini     ierr = VecGetLocalSize(b->lvec,&lsize);CHKERRQ(ierr);
87131e0482f5SStefano Zampini     ierr = ISCreateGeneral(ccomm,lsize,b->garray,PETSC_USE_POINTER,&from);CHKERRQ(ierr);
87141e0482f5SStefano Zampini     ierr = ISCreateStride(PETSC_COMM_SELF,lsize,0,1,&to);CHKERRQ(ierr);
87151e0482f5SStefano Zampini     ierr = MatCreateVecs(*B,&gvec,NULL);CHKERRQ(ierr);
87161e0482f5SStefano Zampini     ierr = VecScatterCreate(gvec,from,b->lvec,to,&b->Mvctx);CHKERRQ(ierr);
87171e0482f5SStefano Zampini     ierr = PetscLogObjectParent((PetscObject)*B,(PetscObject)b->Mvctx);CHKERRQ(ierr);
87181e0482f5SStefano Zampini     ierr = ISDestroy(&from);CHKERRQ(ierr);
87191e0482f5SStefano Zampini     ierr = ISDestroy(&to);CHKERRQ(ierr);
87201e0482f5SStefano Zampini     ierr = VecDestroy(&gvec);CHKERRQ(ierr);
87211e0482f5SStefano Zampini   }
87221e0482f5SStefano Zampini   ierr = MatDestroy(&At);CHKERRQ(ierr);
87231e0482f5SStefano Zampini   PetscFunctionReturn(0);
87241e0482f5SStefano Zampini }
8725