11cf9b237SStefano Zampini #include <../src/mat/impls/aij/seq/aij.h> 2ab5c6b0cSJed Brown #include <../src/ksp/pc/impls/bddc/bddc.h> 3ab5c6b0cSJed Brown #include <../src/ksp/pc/impls/bddc/bddcprivate.h> 4c80a6c00SStefano Zampini #include <petscdmplex.h> 5674ae819SStefano Zampini #include <petscblaslapack.h> 6daf8a457SStefano Zampini #include <petsc/private/sfimpl.h> 7c80a6c00SStefano Zampini #include <petsc/private/dmpleximpl.h> 8674ae819SStefano Zampini 91e0482f5SStefano Zampini static PetscErrorCode MatMPIAIJRestrict(Mat,MPI_Comm,Mat*); 101e0482f5SStefano Zampini 11f498cd09SStefano Zampini /* if range is true, it returns B s.t. span{B} = range(A) 12f498cd09SStefano Zampini if range is false, it returns B s.t. range(B) _|_ range(A) */ 13f498cd09SStefano Zampini PetscErrorCode MatDenseOrthogonalRangeOrComplement(Mat A, PetscBool range, PetscInt lw, PetscScalar *work, PetscReal *rwork, Mat *B) 14a13144ffSStefano Zampini { 15a13144ffSStefano Zampini #if !defined(PETSC_USE_COMPLEX) 16a13144ffSStefano Zampini PetscScalar *uwork,*data,*U, ds = 0.; 17a13144ffSStefano Zampini PetscReal *sing; 18a13144ffSStefano Zampini PetscBLASInt bM,bN,lwork,lierr,di = 1; 19a13144ffSStefano Zampini PetscInt ulw,i,nr,nc,n; 20a13144ffSStefano Zampini PetscErrorCode ierr; 21a13144ffSStefano Zampini 22a13144ffSStefano Zampini PetscFunctionBegin; 23a13144ffSStefano Zampini #if defined(PETSC_MISSING_LAPACK_GESVD) 24a13144ffSStefano Zampini SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"LAPACK _GESVD not available"); 25614dbb09SStefano Zampini #else 26a13144ffSStefano Zampini ierr = MatGetSize(A,&nr,&nc);CHKERRQ(ierr); 27a13144ffSStefano Zampini if (!nr || !nc) PetscFunctionReturn(0); 28a13144ffSStefano Zampini 29a13144ffSStefano Zampini /* workspace */ 30a13144ffSStefano Zampini if (!work) { 31a13144ffSStefano Zampini ulw = PetscMax(PetscMax(1,5*PetscMin(nr,nc)),3*PetscMin(nr,nc)+PetscMax(nr,nc)); 32f913dca9SStefano Zampini ierr = PetscMalloc1(ulw,&uwork);CHKERRQ(ierr); 33a13144ffSStefano Zampini } 
else { 34a13144ffSStefano Zampini ulw = lw; 35a13144ffSStefano Zampini uwork = work; 36a13144ffSStefano Zampini } 37a13144ffSStefano Zampini n = PetscMin(nr,nc); 38a13144ffSStefano Zampini if (!rwork) { 39a13144ffSStefano Zampini ierr = PetscMalloc1(n,&sing);CHKERRQ(ierr); 40a13144ffSStefano Zampini } else { 41a13144ffSStefano Zampini sing = rwork; 42a13144ffSStefano Zampini } 43a13144ffSStefano Zampini 44a13144ffSStefano Zampini /* SVD */ 45a13144ffSStefano Zampini ierr = PetscMalloc1(nr*nr,&U);CHKERRQ(ierr); 46a13144ffSStefano Zampini ierr = PetscBLASIntCast(nr,&bM);CHKERRQ(ierr); 47a13144ffSStefano Zampini ierr = PetscBLASIntCast(nc,&bN);CHKERRQ(ierr); 48a13144ffSStefano Zampini ierr = PetscBLASIntCast(ulw,&lwork);CHKERRQ(ierr); 49a13144ffSStefano Zampini ierr = MatDenseGetArray(A,&data);CHKERRQ(ierr); 50a13144ffSStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 51a13144ffSStefano Zampini PetscStackCallBLAS("LAPACKgesvd",LAPACKgesvd_("A","N",&bM,&bN,data,&bM,sing,U,&bM,&ds,&di,uwork,&lwork,&lierr)); 52a13144ffSStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 53a13144ffSStefano Zampini if (lierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in GESVD Lapack routine %d",(int)lierr); 54a13144ffSStefano Zampini ierr = MatDenseRestoreArray(A,&data);CHKERRQ(ierr); 55a13144ffSStefano Zampini for (i=0;i<n;i++) if (sing[i] < PETSC_SMALL) break; 56a13144ffSStefano Zampini if (!rwork) { 57a13144ffSStefano Zampini ierr = PetscFree(sing);CHKERRQ(ierr); 58a13144ffSStefano Zampini } 59a13144ffSStefano Zampini if (!work) { 60a13144ffSStefano Zampini ierr = PetscFree(uwork);CHKERRQ(ierr); 61a13144ffSStefano Zampini } 62a13144ffSStefano Zampini /* create B */ 63f498cd09SStefano Zampini if (!range) { 64a13144ffSStefano Zampini ierr = MatCreateSeqDense(PETSC_COMM_SELF,nr,nr-i,NULL,B);CHKERRQ(ierr); 65a13144ffSStefano Zampini ierr = MatDenseGetArray(*B,&data);CHKERRQ(ierr); 66a13144ffSStefano Zampini ierr = 
PetscMemcpy(data,U+nr*i,(nr-i)*nr*sizeof(PetscScalar));CHKERRQ(ierr); 67f498cd09SStefano Zampini } else { 68f498cd09SStefano Zampini ierr = MatCreateSeqDense(PETSC_COMM_SELF,nr,i,NULL,B);CHKERRQ(ierr); 69f498cd09SStefano Zampini ierr = MatDenseGetArray(*B,&data);CHKERRQ(ierr); 70f498cd09SStefano Zampini ierr = PetscMemcpy(data,U,i*nr*sizeof(PetscScalar));CHKERRQ(ierr); 71f498cd09SStefano Zampini } 72a13144ffSStefano Zampini ierr = MatDenseRestoreArray(*B,&data);CHKERRQ(ierr); 73a13144ffSStefano Zampini ierr = PetscFree(U);CHKERRQ(ierr); 74614dbb09SStefano Zampini #endif 75614dbb09SStefano Zampini #else /* PETSC_USE_COMPLEX */ 76a13144ffSStefano Zampini PetscFunctionBegin; 77a13144ffSStefano Zampini SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"Not implemented for complexes"); 78a13144ffSStefano Zampini #endif 79a13144ffSStefano Zampini PetscFunctionReturn(0); 80a13144ffSStefano Zampini } 81a13144ffSStefano Zampini 821e0482f5SStefano Zampini /* TODO REMOVE */ 831e0482f5SStefano Zampini #if defined(PRINT_GDET) 841e0482f5SStefano Zampini static int inc = 0; 851e0482f5SStefano Zampini static int lev = 0; 861e0482f5SStefano Zampini #endif 871e0482f5SStefano Zampini 881e0482f5SStefano Zampini PetscErrorCode PCBDDCComputeNedelecChangeEdge(Mat lG, IS edge, IS extrow, IS extcol, IS corners, Mat* Gins, Mat* GKins, PetscScalar cvals[2], PetscScalar *work, PetscReal *rwork) 89a13144ffSStefano Zampini { 90a13144ffSStefano Zampini PetscErrorCode ierr; 91a13144ffSStefano Zampini Mat GE,GEd; 92a13144ffSStefano Zampini PetscInt rsize,csize,esize; 93a13144ffSStefano Zampini PetscScalar *ptr; 94a13144ffSStefano Zampini 95a13144ffSStefano Zampini PetscFunctionBegin; 96a13144ffSStefano Zampini ierr = ISGetSize(edge,&esize);CHKERRQ(ierr); 97c3c0e390SStefano Zampini if (!esize) PetscFunctionReturn(0); 98a13144ffSStefano Zampini ierr = ISGetSize(extrow,&rsize);CHKERRQ(ierr); 99a13144ffSStefano Zampini ierr = ISGetSize(extcol,&csize);CHKERRQ(ierr); 100a13144ffSStefano Zampini 101a13144ffSStefano 
Zampini /* gradients */ 102a13144ffSStefano Zampini ptr = work + 5*esize; 1037dae84e0SHong Zhang ierr = MatCreateSubMatrix(lG,extrow,extcol,MAT_INITIAL_MATRIX,&GE);CHKERRQ(ierr); 104a13144ffSStefano Zampini ierr = MatCreateSeqDense(PETSC_COMM_SELF,rsize,csize,ptr,Gins);CHKERRQ(ierr); 105a13144ffSStefano Zampini ierr = MatConvert(GE,MATSEQDENSE,MAT_REUSE_MATRIX,Gins);CHKERRQ(ierr); 106a13144ffSStefano Zampini ierr = MatDestroy(&GE);CHKERRQ(ierr); 107a13144ffSStefano Zampini 108a13144ffSStefano Zampini /* constants */ 109a13144ffSStefano Zampini ptr += rsize*csize; 110a13144ffSStefano Zampini ierr = MatCreateSeqDense(PETSC_COMM_SELF,esize,csize,ptr,&GEd);CHKERRQ(ierr); 1117dae84e0SHong Zhang ierr = MatCreateSubMatrix(lG,edge,extcol,MAT_INITIAL_MATRIX,&GE);CHKERRQ(ierr); 112a13144ffSStefano Zampini ierr = MatConvert(GE,MATSEQDENSE,MAT_REUSE_MATRIX,&GEd);CHKERRQ(ierr); 113a13144ffSStefano Zampini ierr = MatDestroy(&GE);CHKERRQ(ierr); 114f498cd09SStefano Zampini ierr = MatDenseOrthogonalRangeOrComplement(GEd,PETSC_FALSE,5*esize,work,rwork,GKins);CHKERRQ(ierr); 115a13144ffSStefano Zampini ierr = MatDestroy(&GEd);CHKERRQ(ierr); 1161e0482f5SStefano Zampini 1171e0482f5SStefano Zampini if (corners) { 1181e0482f5SStefano Zampini Mat GEc; 1191e0482f5SStefano Zampini PetscScalar *vals,v; 1201e0482f5SStefano Zampini 1217dae84e0SHong Zhang ierr = MatCreateSubMatrix(lG,edge,corners,MAT_INITIAL_MATRIX,&GEc);CHKERRQ(ierr); 1221e0482f5SStefano Zampini ierr = MatTransposeMatMult(GEc,*GKins,MAT_INITIAL_MATRIX,1.0,&GEd);CHKERRQ(ierr); 1231e0482f5SStefano Zampini ierr = MatDenseGetArray(GEd,&vals);CHKERRQ(ierr); 124637e8532SStefano Zampini /* v = PetscAbsScalar(vals[0]) */; 125637e8532SStefano Zampini v = 1.; 1261e0482f5SStefano Zampini cvals[0] = vals[0]/v; 1271e0482f5SStefano Zampini cvals[1] = vals[1]/v; 1281e0482f5SStefano Zampini ierr = MatDenseRestoreArray(GEd,&vals);CHKERRQ(ierr); 1291e0482f5SStefano Zampini ierr = MatScale(*GKins,1./v);CHKERRQ(ierr); 1301e0482f5SStefano Zampini 
#if defined(PRINT_GDET) 1311e0482f5SStefano Zampini { 1321e0482f5SStefano Zampini PetscViewer viewer; 1331e0482f5SStefano Zampini char filename[256]; 1341e0482f5SStefano Zampini sprintf(filename,"Gdet_l%d_r%d_cc%d.m",lev,PetscGlobalRank,inc++); 1351e0482f5SStefano Zampini ierr = PetscViewerASCIIOpen(PETSC_COMM_SELF,filename,&viewer);CHKERRQ(ierr); 1361e0482f5SStefano Zampini ierr = PetscViewerPushFormat(viewer,PETSC_VIEWER_ASCII_MATLAB);CHKERRQ(ierr); 1371e0482f5SStefano Zampini ierr = PetscObjectSetName((PetscObject)GEc,"GEc");CHKERRQ(ierr); 1381e0482f5SStefano Zampini ierr = MatView(GEc,viewer);CHKERRQ(ierr); 1391e0482f5SStefano Zampini ierr = PetscObjectSetName((PetscObject)(*GKins),"GK");CHKERRQ(ierr); 1401e0482f5SStefano Zampini ierr = MatView(*GKins,viewer);CHKERRQ(ierr); 1411e0482f5SStefano Zampini ierr = PetscObjectSetName((PetscObject)GEd,"Gproj");CHKERRQ(ierr); 1421e0482f5SStefano Zampini ierr = MatView(GEd,viewer);CHKERRQ(ierr); 1431e0482f5SStefano Zampini ierr = PetscViewerDestroy(&viewer);CHKERRQ(ierr); 1441e0482f5SStefano Zampini } 1451e0482f5SStefano Zampini #endif 1461e0482f5SStefano Zampini ierr = MatDestroy(&GEd);CHKERRQ(ierr); 1471e0482f5SStefano Zampini ierr = MatDestroy(&GEc);CHKERRQ(ierr); 1481e0482f5SStefano Zampini } 1491e0482f5SStefano Zampini 150a13144ffSStefano Zampini PetscFunctionReturn(0); 151a13144ffSStefano Zampini } 152a13144ffSStefano Zampini 153a13144ffSStefano Zampini PetscErrorCode PCBDDCNedelecSupport(PC pc) 154a13144ffSStefano Zampini { 155a13144ffSStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 156a13144ffSStefano Zampini Mat_IS *matis = (Mat_IS*)pc->pmat->data; 1570569b399SStefano Zampini Mat G,T,conn,lG,lGt,lGis,lGall,lGe,lGinit; 158eee23b56SStefano Zampini Vec tvec; 159a13144ffSStefano Zampini PetscSF sfv; 1601e0482f5SStefano Zampini ISLocalToGlobalMapping el2g,vl2g,fl2g,al2g; 161a13144ffSStefano Zampini MPI_Comm comm; 162c2151214SStefano Zampini IS lned,primals,allprimals,nedfieldlocal; 163c2151214SStefano Zampini 
IS *eedges,*extrows,*extcols,*alleedges; 1647d871cd7SStefano Zampini PetscBT btv,bte,btvc,btb,btbd,btvcand,btvi,btee,bter; 165a13144ffSStefano Zampini PetscScalar *vals,*work; 166a13144ffSStefano Zampini PetscReal *rwork; 167a13144ffSStefano Zampini const PetscInt *idxs,*ii,*jj,*iit,*jjt; 1681e0482f5SStefano Zampini PetscInt ne,nv,Lv,order,n,field; 169a13144ffSStefano Zampini PetscInt n_neigh,*neigh,*n_shared,**shared; 170eee23b56SStefano Zampini PetscInt i,j,extmem,cum,maxsize,nee; 171b03ebc13SStefano Zampini PetscInt *extrow,*extrowcum,*marks,*vmarks,*gidxs; 172a13144ffSStefano Zampini PetscInt *sfvleaves,*sfvroots; 173b03ebc13SStefano Zampini PetscInt *corners,*cedges; 174637e8532SStefano Zampini PetscInt *ecount,**eneighs,*vcount,**vneighs; 175b03ebc13SStefano Zampini #if defined(PETSC_USE_DEBUG) 176b03ebc13SStefano Zampini PetscInt *emarks; 177b03ebc13SStefano Zampini #endif 178213b8bfaSStefano Zampini PetscBool print,eerr,done,lrc[2],conforming,global,singular,setprimal; 179a13144ffSStefano Zampini PetscErrorCode ierr; 180a13144ffSStefano Zampini 181a13144ffSStefano Zampini PetscFunctionBegin; 182213b8bfaSStefano Zampini /* If the discrete gradient is defined for a subset of dofs and global is true, 183213b8bfaSStefano Zampini it assumes G is given in global ordering for all the dofs. 
184213b8bfaSStefano Zampini Otherwise, the ordering is global for the Nedelec field */ 185213b8bfaSStefano Zampini order = pcbddc->nedorder; 186213b8bfaSStefano Zampini conforming = pcbddc->conforming; 187213b8bfaSStefano Zampini field = pcbddc->nedfield; 188213b8bfaSStefano Zampini global = pcbddc->nedglobal; 189213b8bfaSStefano Zampini setprimal = PETSC_FALSE; 190a13144ffSStefano Zampini print = PETSC_FALSE; 191213b8bfaSStefano Zampini singular = PETSC_FALSE; 192a13144ffSStefano Zampini 193213b8bfaSStefano Zampini /* Command line customization */ 194213b8bfaSStefano Zampini ierr = PetscOptionsBegin(PetscObjectComm((PetscObject)pc),((PetscObject)pc)->prefix,"BDDC Nedelec options","PC");CHKERRQ(ierr); 195213b8bfaSStefano Zampini ierr = PetscOptionsBool("-pc_bddc_nedelec_field_primal","All edge dofs set as primals: Toselli's algorithm C",NULL,setprimal,&setprimal,NULL);CHKERRQ(ierr); 196213b8bfaSStefano Zampini ierr = PetscOptionsBool("-pc_bddc_nedelec_singular","Infer nullspace from discrete gradient",NULL,singular,&singular,NULL);CHKERRQ(ierr); 197213b8bfaSStefano Zampini ierr = PetscOptionsInt("-pc_bddc_nedelec_order","Test variable order code (to be removed)",NULL,order,&order,NULL);CHKERRQ(ierr); 198213b8bfaSStefano Zampini /* print debug info TODO: to be removed */ 199213b8bfaSStefano Zampini ierr = PetscOptionsBool("-pc_bddc_nedelec_print","Print debug info",NULL,print,&print,NULL);CHKERRQ(ierr); 200213b8bfaSStefano Zampini ierr = PetscOptionsEnd();CHKERRQ(ierr); 201213b8bfaSStefano Zampini 202213b8bfaSStefano Zampini /* Return if there are no edges in the decomposition and the problem is not singular */ 2031e0482f5SStefano Zampini ierr = MatGetLocalToGlobalMapping(pc->pmat,&al2g,NULL);CHKERRQ(ierr); 2041e0482f5SStefano Zampini ierr = ISLocalToGlobalMappingGetSize(al2g,&n);CHKERRQ(ierr); 205213b8bfaSStefano Zampini ierr = PetscObjectGetComm((PetscObject)pc,&comm);CHKERRQ(ierr); 206213b8bfaSStefano Zampini if (!singular) { 207a13144ffSStefano Zampini ierr = 
VecGetArrayRead(matis->counter,(const PetscScalar**)&vals);CHKERRQ(ierr); 208a13144ffSStefano Zampini lrc[0] = PETSC_FALSE; 209c2151214SStefano Zampini for (i=0;i<n;i++) { 210a13144ffSStefano Zampini if (PetscRealPart(vals[i]) > 2.) { 211a13144ffSStefano Zampini lrc[0] = PETSC_TRUE; 212a13144ffSStefano Zampini break; 213a13144ffSStefano Zampini } 214a13144ffSStefano Zampini } 215a13144ffSStefano Zampini ierr = VecRestoreArrayRead(matis->counter,(const PetscScalar**)&vals);CHKERRQ(ierr); 216a13144ffSStefano Zampini ierr = MPIU_Allreduce(&lrc[0],&lrc[1],1,MPIU_BOOL,MPI_LOR,comm);CHKERRQ(ierr); 217a13144ffSStefano Zampini if (!lrc[1]) PetscFunctionReturn(0); 218213b8bfaSStefano Zampini } 219a13144ffSStefano Zampini 220213b8bfaSStefano Zampini /* Get Nedelec field */ 221213b8bfaSStefano Zampini ierr = MatISSetUpSF(pc->pmat);CHKERRQ(ierr); 222c2151214SStefano Zampini if (pcbddc->n_ISForDofsLocal && field >= pcbddc->n_ISForDofsLocal) SETERRQ2(comm,PETSC_ERR_USER,"Invalid field for Nedelec %d: number of fields is %d",field,pcbddc->n_ISForDofsLocal); 223213b8bfaSStefano Zampini if (pcbddc->n_ISForDofsLocal && field >= 0) { 224c2151214SStefano Zampini ierr = PetscObjectReference((PetscObject)pcbddc->ISForDofsLocal[field]);CHKERRQ(ierr); 225c2151214SStefano Zampini nedfieldlocal = pcbddc->ISForDofsLocal[field]; 226c2151214SStefano Zampini ierr = ISGetLocalSize(nedfieldlocal,&ne);CHKERRQ(ierr); 227213b8bfaSStefano Zampini } else if (!pcbddc->n_ISForDofsLocal && field != PETSC_DECIDE) { 228213b8bfaSStefano Zampini ne = n; 229213b8bfaSStefano Zampini nedfieldlocal = NULL; 230213b8bfaSStefano Zampini global = PETSC_TRUE; 231213b8bfaSStefano Zampini } else if (field == PETSC_DECIDE) { 232213b8bfaSStefano Zampini PetscInt rst,ren,*idx; 233213b8bfaSStefano Zampini 234213b8bfaSStefano Zampini ierr = PetscMemzero(matis->sf_leafdata,n*sizeof(PetscInt));CHKERRQ(ierr); 235213b8bfaSStefano Zampini ierr = PetscMemzero(matis->sf_rootdata,pc->pmat->rmap->n*sizeof(PetscInt));CHKERRQ(ierr); 
236213b8bfaSStefano Zampini ierr = MatGetOwnershipRange(pcbddc->discretegradient,&rst,&ren);CHKERRQ(ierr); 237213b8bfaSStefano Zampini for (i=rst;i<ren;i++) { 238213b8bfaSStefano Zampini PetscInt nc; 239213b8bfaSStefano Zampini 240213b8bfaSStefano Zampini ierr = MatGetRow(pcbddc->discretegradient,i,&nc,NULL,NULL);CHKERRQ(ierr); 241213b8bfaSStefano Zampini if (nc > 1) matis->sf_rootdata[i-rst] = 1; 242213b8bfaSStefano Zampini ierr = MatRestoreRow(pcbddc->discretegradient,i,&nc,NULL,NULL);CHKERRQ(ierr); 243213b8bfaSStefano Zampini } 244213b8bfaSStefano Zampini ierr = PetscSFBcastBegin(matis->sf,MPIU_INT,matis->sf_rootdata,matis->sf_leafdata);CHKERRQ(ierr); 245213b8bfaSStefano Zampini ierr = PetscSFBcastEnd(matis->sf,MPIU_INT,matis->sf_rootdata,matis->sf_leafdata);CHKERRQ(ierr); 246213b8bfaSStefano Zampini ierr = PetscMalloc1(n,&idx);CHKERRQ(ierr); 247213b8bfaSStefano Zampini for (i=0,ne=0;i<n;i++) if (matis->sf_leafdata[i]) idx[ne++] = i; 248213b8bfaSStefano Zampini ierr = ISCreateGeneral(comm,ne,idx,PETSC_OWN_POINTER,&nedfieldlocal);CHKERRQ(ierr); 249213b8bfaSStefano Zampini } else { 250213b8bfaSStefano Zampini SETERRQ(comm,PETSC_ERR_USER,"When multiple fields are present, the Nedelec field has to be specified"); 251213b8bfaSStefano Zampini } 252213b8bfaSStefano Zampini 253213b8bfaSStefano Zampini /* Sanity checks */ 254213b8bfaSStefano Zampini if (!order && !conforming) SETERRQ(comm,PETSC_ERR_SUP,"Variable order and non-conforming spaces are not supported at the same time"); 255213b8bfaSStefano Zampini if (pcbddc->user_ChangeOfBasisMatrix) SETERRQ(comm,PETSC_ERR_SUP,"Cannot generate Nedelec support with user defined change of basis"); 256213b8bfaSStefano Zampini if (order && ne%order) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_USER,"The number of local edge dofs %d it's not a multiple of the order %d",ne,order); 257213b8bfaSStefano Zampini 258213b8bfaSStefano Zampini /* Just set primal dofs and return */ 2591e0482f5SStefano Zampini if (setprimal) { 260eee23b56SStefano 
Zampini IS enedfieldlocal; 261eee23b56SStefano Zampini PetscInt *eidxs; 262eee23b56SStefano Zampini 263eee23b56SStefano Zampini ierr = PetscMalloc1(ne,&eidxs);CHKERRQ(ierr); 264eee23b56SStefano Zampini ierr = VecGetArrayRead(matis->counter,(const PetscScalar**)&vals);CHKERRQ(ierr); 265213b8bfaSStefano Zampini if (nedfieldlocal) { 266213b8bfaSStefano Zampini ierr = ISGetIndices(nedfieldlocal,&idxs);CHKERRQ(ierr); 267eee23b56SStefano Zampini for (i=0,cum=0;i<ne;i++) { 268eee23b56SStefano Zampini if (PetscRealPart(vals[idxs[i]]) > 2.) { 269eee23b56SStefano Zampini eidxs[cum++] = idxs[i]; 270eee23b56SStefano Zampini } 271eee23b56SStefano Zampini } 272eee23b56SStefano Zampini ierr = ISRestoreIndices(nedfieldlocal,&idxs);CHKERRQ(ierr); 273213b8bfaSStefano Zampini } else { 274213b8bfaSStefano Zampini for (i=0,cum=0;i<ne;i++) { 275213b8bfaSStefano Zampini if (PetscRealPart(vals[i]) > 2.) { 276213b8bfaSStefano Zampini eidxs[cum++] = i; 277213b8bfaSStefano Zampini } 278213b8bfaSStefano Zampini } 279213b8bfaSStefano Zampini } 280213b8bfaSStefano Zampini ierr = VecRestoreArrayRead(matis->counter,(const PetscScalar**)&vals);CHKERRQ(ierr); 281eee23b56SStefano Zampini ierr = ISCreateGeneral(comm,cum,eidxs,PETSC_COPY_VALUES,&enedfieldlocal);CHKERRQ(ierr); 282eee23b56SStefano Zampini ierr = PCBDDCSetPrimalVerticesLocalIS(pc,enedfieldlocal);CHKERRQ(ierr); 283eee23b56SStefano Zampini ierr = PetscFree(eidxs);CHKERRQ(ierr); 2841e0482f5SStefano Zampini ierr = ISDestroy(&nedfieldlocal);CHKERRQ(ierr); 285eee23b56SStefano Zampini ierr = ISDestroy(&enedfieldlocal);CHKERRQ(ierr); 2861e0482f5SStefano Zampini PetscFunctionReturn(0); 2871e0482f5SStefano Zampini } 288a13144ffSStefano Zampini 289213b8bfaSStefano Zampini /* Compute some l2g maps */ 290213b8bfaSStefano Zampini if (nedfieldlocal) { 291c2151214SStefano Zampini IS is; 292c2151214SStefano Zampini 293c2151214SStefano Zampini /* need to map from the local Nedelec field to local numbering */ 294c2151214SStefano Zampini ierr = 
ISLocalToGlobalMappingCreateIS(nedfieldlocal,&fl2g);CHKERRQ(ierr); 2951e0482f5SStefano Zampini /* need to map from the local Nedelec field to global numbering for the whole dofs*/ 2961e0482f5SStefano Zampini ierr = ISLocalToGlobalMappingApplyIS(al2g,nedfieldlocal,&is);CHKERRQ(ierr); 2971e0482f5SStefano Zampini ierr = ISLocalToGlobalMappingCreateIS(is,&al2g);CHKERRQ(ierr); 2981e0482f5SStefano Zampini /* need to map from the local Nedelec field to global numbering (for Nedelec only) */ 2991e0482f5SStefano Zampini if (global) { 3001e0482f5SStefano Zampini ierr = PetscObjectReference((PetscObject)al2g);CHKERRQ(ierr); 3011e0482f5SStefano Zampini el2g = al2g; 3021e0482f5SStefano Zampini } else { 3031e0482f5SStefano Zampini IS gis; 3041e0482f5SStefano Zampini 3051e0482f5SStefano Zampini ierr = ISRenumber(is,NULL,NULL,&gis);CHKERRQ(ierr); 3061e0482f5SStefano Zampini ierr = ISLocalToGlobalMappingCreateIS(gis,&el2g);CHKERRQ(ierr); 3071e0482f5SStefano Zampini ierr = ISDestroy(&gis);CHKERRQ(ierr); 3081e0482f5SStefano Zampini } 309c2151214SStefano Zampini ierr = ISDestroy(&is);CHKERRQ(ierr); 310c2151214SStefano Zampini } else { 3111e0482f5SStefano Zampini /* restore default */ 3121e0482f5SStefano Zampini pcbddc->nedfield = -1; 3131e0482f5SStefano Zampini /* one ref for the destruction of al2g, one for el2g */ 3141e0482f5SStefano Zampini ierr = PetscObjectReference((PetscObject)al2g);CHKERRQ(ierr); 3151e0482f5SStefano Zampini ierr = PetscObjectReference((PetscObject)al2g);CHKERRQ(ierr); 3161e0482f5SStefano Zampini el2g = al2g; 317c2151214SStefano Zampini fl2g = NULL; 318c2151214SStefano Zampini } 319a13144ffSStefano Zampini 320213b8bfaSStefano Zampini /* Start communication to drop connections for interior edges (for cc analysis only) */ 321c2151214SStefano Zampini ierr = PetscMemzero(matis->sf_leafdata,n*sizeof(PetscInt));CHKERRQ(ierr); 322c2151214SStefano Zampini ierr = PetscMemzero(matis->sf_rootdata,pc->pmat->rmap->n*sizeof(PetscInt));CHKERRQ(ierr); 323c2151214SStefano 
Zampini if (nedfieldlocal) { 324c2151214SStefano Zampini ierr = ISGetIndices(nedfieldlocal,&idxs);CHKERRQ(ierr); 325c2151214SStefano Zampini for (i=0;i<ne;i++) matis->sf_leafdata[idxs[i]] = 1; 326c2151214SStefano Zampini ierr = ISRestoreIndices(nedfieldlocal,&idxs);CHKERRQ(ierr); 327c2151214SStefano Zampini } else { 328c2151214SStefano Zampini for (i=0;i<ne;i++) matis->sf_leafdata[i] = 1; 329c2151214SStefano Zampini } 330c2151214SStefano Zampini ierr = PetscSFReduceBegin(matis->sf,MPIU_INT,matis->sf_leafdata,matis->sf_rootdata,MPI_SUM);CHKERRQ(ierr); 331c2151214SStefano Zampini ierr = PetscSFReduceEnd(matis->sf,MPIU_INT,matis->sf_leafdata,matis->sf_rootdata,MPI_SUM);CHKERRQ(ierr); 332213b8bfaSStefano Zampini 333213b8bfaSStefano Zampini if (!singular) { /* drop connections with interior edges to avoid unneeded communications and memory movements */ 334213b8bfaSStefano Zampini ierr = MatDuplicate(pcbddc->discretegradient,MAT_COPY_VALUES,&G);CHKERRQ(ierr); 335213b8bfaSStefano Zampini ierr = MatSetOption(G,MAT_KEEP_NONZERO_PATTERN,PETSC_FALSE);CHKERRQ(ierr); 3361e0482f5SStefano Zampini if (global) { 3371e0482f5SStefano Zampini PetscInt rst; 3381e0482f5SStefano Zampini 339c2151214SStefano Zampini ierr = MatGetOwnershipRange(G,&rst,NULL);CHKERRQ(ierr); 340c2151214SStefano Zampini for (i=0,cum=0;i<pc->pmat->rmap->n;i++) { 341c2151214SStefano Zampini if (matis->sf_rootdata[i] < 2) { 342c2151214SStefano Zampini matis->sf_rootdata[cum++] = i + rst; 343c2151214SStefano Zampini } 344c2151214SStefano Zampini } 345a13144ffSStefano Zampini ierr = MatSetOption(G,MAT_NO_OFF_PROC_ZERO_ROWS,PETSC_TRUE);CHKERRQ(ierr); 346c2151214SStefano Zampini ierr = MatZeroRows(G,cum,matis->sf_rootdata,0.,NULL,NULL);CHKERRQ(ierr); 3471e0482f5SStefano Zampini } else { 3481e0482f5SStefano Zampini PetscInt *tbz; 3491e0482f5SStefano Zampini 3501e0482f5SStefano Zampini ierr = PetscMalloc1(ne,&tbz);CHKERRQ(ierr); 3511e0482f5SStefano Zampini ierr = 
PetscSFBcastBegin(matis->sf,MPIU_INT,matis->sf_rootdata,matis->sf_leafdata);CHKERRQ(ierr); 3521e0482f5SStefano Zampini ierr = PetscSFBcastEnd(matis->sf,MPIU_INT,matis->sf_rootdata,matis->sf_leafdata);CHKERRQ(ierr); 3531e0482f5SStefano Zampini ierr = ISGetIndices(nedfieldlocal,&idxs);CHKERRQ(ierr); 3541e0482f5SStefano Zampini for (i=0,cum=0;i<ne;i++) 3551e0482f5SStefano Zampini if (matis->sf_leafdata[idxs[i]] == 1) 3561e0482f5SStefano Zampini tbz[cum++] = i; 3571e0482f5SStefano Zampini ierr = ISRestoreIndices(nedfieldlocal,&idxs);CHKERRQ(ierr); 3581e0482f5SStefano Zampini ierr = ISLocalToGlobalMappingApply(el2g,cum,tbz,tbz);CHKERRQ(ierr); 3591e0482f5SStefano Zampini ierr = MatZeroRows(G,cum,tbz,0.,NULL,NULL);CHKERRQ(ierr); 3601e0482f5SStefano Zampini ierr = PetscFree(tbz);CHKERRQ(ierr); 3611e0482f5SStefano Zampini } 362213b8bfaSStefano Zampini } else { /* we need the entire G to infer the nullspace */ 363213b8bfaSStefano Zampini ierr = PetscObjectReference((PetscObject)pcbddc->discretegradient);CHKERRQ(ierr); 364213b8bfaSStefano Zampini G = pcbddc->discretegradient; 365213b8bfaSStefano Zampini } 366a13144ffSStefano Zampini 367a13144ffSStefano Zampini /* Extract subdomain relevant rows of G */ 368a13144ffSStefano Zampini ierr = ISLocalToGlobalMappingGetIndices(el2g,&idxs);CHKERRQ(ierr); 369a13144ffSStefano Zampini ierr = ISCreateGeneral(comm,ne,idxs,PETSC_USE_POINTER,&lned);CHKERRQ(ierr); 3707dae84e0SHong Zhang ierr = MatCreateSubMatrix(G,lned,NULL,MAT_INITIAL_MATRIX,&lGall);CHKERRQ(ierr); 371a13144ffSStefano Zampini ierr = ISLocalToGlobalMappingRestoreIndices(el2g,&idxs);CHKERRQ(ierr); 372a13144ffSStefano Zampini ierr = ISDestroy(&lned);CHKERRQ(ierr); 373a13144ffSStefano Zampini ierr = MatConvert(lGall,MATIS,MAT_INITIAL_MATRIX,&lGis);CHKERRQ(ierr); 374a13144ffSStefano Zampini ierr = MatDestroy(&lGall);CHKERRQ(ierr); 375a13144ffSStefano Zampini ierr = MatISGetLocalMat(lGis,&lG);CHKERRQ(ierr); 376a13144ffSStefano Zampini 377213b8bfaSStefano Zampini /* SF for nodal 
dofs communications */ 378c2151214SStefano Zampini ierr = MatGetLocalSize(G,NULL,&Lv);CHKERRQ(ierr); 379a13144ffSStefano Zampini ierr = MatGetLocalToGlobalMapping(lGis,NULL,&vl2g);CHKERRQ(ierr); 380a13144ffSStefano Zampini ierr = PetscObjectReference((PetscObject)vl2g);CHKERRQ(ierr); 381a13144ffSStefano Zampini ierr = ISLocalToGlobalMappingGetSize(vl2g,&nv);CHKERRQ(ierr); 382a13144ffSStefano Zampini ierr = PetscSFCreate(comm,&sfv);CHKERRQ(ierr); 383a13144ffSStefano Zampini ierr = ISLocalToGlobalMappingGetIndices(vl2g,&idxs);CHKERRQ(ierr); 384a13144ffSStefano Zampini ierr = PetscSFSetGraphLayout(sfv,lGis->cmap,nv,NULL,PETSC_OWN_POINTER,idxs);CHKERRQ(ierr); 385a13144ffSStefano Zampini ierr = ISLocalToGlobalMappingRestoreIndices(vl2g,&idxs);CHKERRQ(ierr); 386213b8bfaSStefano Zampini i = singular ? 2 : 1; 387213b8bfaSStefano Zampini ierr = PetscMalloc2(i*nv,&sfvleaves,i*Lv,&sfvroots);CHKERRQ(ierr); 388a13144ffSStefano Zampini 3891e0482f5SStefano Zampini /* Destroy temporary G created in MATIS format and modified G */ 390213b8bfaSStefano Zampini ierr = PetscObjectReference((PetscObject)lG);CHKERRQ(ierr); 391a13144ffSStefano Zampini ierr = MatDestroy(&lGis);CHKERRQ(ierr); 392213b8bfaSStefano Zampini ierr = MatDestroy(&G);CHKERRQ(ierr); 393a13144ffSStefano Zampini 394213b8bfaSStefano Zampini if (print) { 395213b8bfaSStefano Zampini ierr = PetscObjectSetName((PetscObject)lG,"initial_lG");CHKERRQ(ierr); 396213b8bfaSStefano Zampini ierr = MatView(lG,NULL);CHKERRQ(ierr); 397213b8bfaSStefano Zampini } 398213b8bfaSStefano Zampini 399213b8bfaSStefano Zampini /* Save lG for values insertion in change of basis */ 4000569b399SStefano Zampini ierr = MatDuplicate(lG,MAT_COPY_VALUES,&lGinit);CHKERRQ(ierr); 4010569b399SStefano Zampini 402a13144ffSStefano Zampini /* Analyze the edge-nodes connections (duplicate lG) */ 4034e64d54eSstefano_zampini ierr = MatDuplicate(lG,MAT_COPY_VALUES,&lGe);CHKERRQ(ierr); 4044e64d54eSstefano_zampini ierr = 
MatSetOption(lGe,MAT_KEEP_NONZERO_PATTERN,PETSC_FALSE);CHKERRQ(ierr); 405a13144ffSStefano Zampini ierr = PetscBTCreate(nv,&btv);CHKERRQ(ierr); 406a13144ffSStefano Zampini ierr = PetscBTCreate(ne,&bte);CHKERRQ(ierr); 407a13144ffSStefano Zampini ierr = PetscBTCreate(ne,&btb);CHKERRQ(ierr); 4087d871cd7SStefano Zampini ierr = PetscBTCreate(ne,&btbd);CHKERRQ(ierr); 409c2151214SStefano Zampini ierr = PetscBTCreate(nv,&btvcand);CHKERRQ(ierr); 410a13144ffSStefano Zampini /* need to import the boundary specification to ensure the 411a13144ffSStefano Zampini proper detection of coarse edges' endpoints */ 412a13144ffSStefano Zampini if (pcbddc->DirichletBoundariesLocal) { 413c2151214SStefano Zampini IS is; 414c2151214SStefano Zampini 415c2151214SStefano Zampini if (fl2g) { 416c2151214SStefano Zampini ierr = ISGlobalToLocalMappingApplyIS(fl2g,IS_GTOLM_MASK,pcbddc->DirichletBoundariesLocal,&is);CHKERRQ(ierr); 417c2151214SStefano Zampini } else { 418c2151214SStefano Zampini is = pcbddc->DirichletBoundariesLocal; 419c2151214SStefano Zampini } 420c2151214SStefano Zampini ierr = ISGetLocalSize(is,&cum);CHKERRQ(ierr); 421c2151214SStefano Zampini ierr = ISGetIndices(is,&idxs);CHKERRQ(ierr); 422a13144ffSStefano Zampini for (i=0;i<cum;i++) { 423a13144ffSStefano Zampini if (idxs[i] >= 0) { 424a13144ffSStefano Zampini ierr = PetscBTSet(btb,idxs[i]);CHKERRQ(ierr); 4257d871cd7SStefano Zampini ierr = PetscBTSet(btbd,idxs[i]);CHKERRQ(ierr); 426a13144ffSStefano Zampini } 427a13144ffSStefano Zampini } 428c2151214SStefano Zampini ierr = ISRestoreIndices(is,&idxs);CHKERRQ(ierr); 429c2151214SStefano Zampini if (fl2g) { 430c2151214SStefano Zampini ierr = ISDestroy(&is);CHKERRQ(ierr); 431c2151214SStefano Zampini } 432a13144ffSStefano Zampini } 433a13144ffSStefano Zampini if (pcbddc->NeumannBoundariesLocal) { 434c2151214SStefano Zampini IS is; 435c2151214SStefano Zampini 436c2151214SStefano Zampini if (fl2g) { 437c2151214SStefano Zampini ierr = 
ISGlobalToLocalMappingApplyIS(fl2g,IS_GTOLM_MASK,pcbddc->NeumannBoundariesLocal,&is);CHKERRQ(ierr); 438c2151214SStefano Zampini } else { 439c2151214SStefano Zampini is = pcbddc->NeumannBoundariesLocal; 440c2151214SStefano Zampini } 441c2151214SStefano Zampini ierr = ISGetLocalSize(is,&cum);CHKERRQ(ierr); 442c2151214SStefano Zampini ierr = ISGetIndices(is,&idxs);CHKERRQ(ierr); 443a13144ffSStefano Zampini for (i=0;i<cum;i++) { 444a13144ffSStefano Zampini if (idxs[i] >= 0) { 445a13144ffSStefano Zampini ierr = PetscBTSet(btb,idxs[i]);CHKERRQ(ierr); 446a13144ffSStefano Zampini } 447a13144ffSStefano Zampini } 448c2151214SStefano Zampini ierr = ISRestoreIndices(is,&idxs);CHKERRQ(ierr); 449c2151214SStefano Zampini if (fl2g) { 450c2151214SStefano Zampini ierr = ISDestroy(&is);CHKERRQ(ierr); 451a13144ffSStefano Zampini } 452c2151214SStefano Zampini } 453c2151214SStefano Zampini 454213b8bfaSStefano Zampini /* Count neighs per dof */ 455637e8532SStefano Zampini ierr = PetscCalloc1(ne,&ecount);CHKERRQ(ierr); 456637e8532SStefano Zampini ierr = PetscMalloc1(ne,&eneighs);CHKERRQ(ierr); 457637e8532SStefano Zampini ierr = ISLocalToGlobalMappingGetInfo(el2g,&n_neigh,&neigh,&n_shared,&shared);CHKERRQ(ierr); 458637e8532SStefano Zampini for (i=1,cum=0;i<n_neigh;i++) { 459637e8532SStefano Zampini cum += n_shared[i]; 460637e8532SStefano Zampini for (j=0;j<n_shared[i];j++) { 461637e8532SStefano Zampini ecount[shared[i][j]]++; 462637e8532SStefano Zampini } 463637e8532SStefano Zampini } 464637e8532SStefano Zampini if (ne) { 465637e8532SStefano Zampini ierr = PetscMalloc1(cum,&eneighs[0]);CHKERRQ(ierr); 466637e8532SStefano Zampini } 467637e8532SStefano Zampini for (i=1;i<ne;i++) eneighs[i] = eneighs[i-1] + ecount[i-1]; 468637e8532SStefano Zampini ierr = PetscMemzero(ecount,ne*sizeof(PetscInt));CHKERRQ(ierr); 469637e8532SStefano Zampini for (i=1;i<n_neigh;i++) { 470637e8532SStefano Zampini for (j=0;j<n_shared[i];j++) { 471637e8532SStefano Zampini PetscInt k = shared[i][j]; 472637e8532SStefano 
Zampini eneighs[k][ecount[k]] = neigh[i]; 473637e8532SStefano Zampini ecount[k]++; 474637e8532SStefano Zampini } 475637e8532SStefano Zampini } 476637e8532SStefano Zampini for (i=0;i<ne;i++) { 477637e8532SStefano Zampini ierr = PetscSortRemoveDupsInt(&ecount[i],eneighs[i]);CHKERRQ(ierr); 478637e8532SStefano Zampini } 479637e8532SStefano Zampini ierr = ISLocalToGlobalMappingRestoreInfo(el2g,&n_neigh,&neigh,&n_shared,&shared);CHKERRQ(ierr); 480637e8532SStefano Zampini ierr = PetscCalloc1(nv,&vcount);CHKERRQ(ierr); 481637e8532SStefano Zampini ierr = PetscMalloc1(nv,&vneighs);CHKERRQ(ierr); 482637e8532SStefano Zampini ierr = ISLocalToGlobalMappingGetInfo(vl2g,&n_neigh,&neigh,&n_shared,&shared);CHKERRQ(ierr); 483637e8532SStefano Zampini for (i=1,cum=0;i<n_neigh;i++) { 484637e8532SStefano Zampini cum += n_shared[i]; 485637e8532SStefano Zampini for (j=0;j<n_shared[i];j++) { 486637e8532SStefano Zampini vcount[shared[i][j]]++; 487637e8532SStefano Zampini } 488637e8532SStefano Zampini } 489637e8532SStefano Zampini if (nv) { 490637e8532SStefano Zampini ierr = PetscMalloc1(cum,&vneighs[0]);CHKERRQ(ierr); 491637e8532SStefano Zampini } 492637e8532SStefano Zampini for (i=1;i<nv;i++) vneighs[i] = vneighs[i-1] + vcount[i-1]; 493637e8532SStefano Zampini ierr = PetscMemzero(vcount,nv*sizeof(PetscInt));CHKERRQ(ierr); 494637e8532SStefano Zampini for (i=1;i<n_neigh;i++) { 495637e8532SStefano Zampini for (j=0;j<n_shared[i];j++) { 496637e8532SStefano Zampini PetscInt k = shared[i][j]; 497637e8532SStefano Zampini vneighs[k][vcount[k]] = neigh[i]; 498637e8532SStefano Zampini vcount[k]++; 499637e8532SStefano Zampini } 500637e8532SStefano Zampini } 501637e8532SStefano Zampini for (i=0;i<nv;i++) { 502637e8532SStefano Zampini ierr = PetscSortRemoveDupsInt(&vcount[i],vneighs[i]);CHKERRQ(ierr); 503637e8532SStefano Zampini } 504637e8532SStefano Zampini ierr = ISLocalToGlobalMappingRestoreInfo(vl2g,&n_neigh,&neigh,&n_shared,&shared);CHKERRQ(ierr); 505637e8532SStefano Zampini 5067d871cd7SStefano 
Zampini /* need to remove coarse faces' dofs and coarse edges' dirichlet dofs 5077d871cd7SStefano Zampini for proper detection of coarse edges' endpoints */ 50862b0c6f7SStefano Zampini ierr = PetscBTCreate(ne,&btee);CHKERRQ(ierr); 50962b0c6f7SStefano Zampini for (i=0;i<ne;i++) { 5107d871cd7SStefano Zampini if ((ecount[i] > 1 && !PetscBTLookup(btbd,i)) || (ecount[i] == 1 && PetscBTLookup(btb,i))) { 51162b0c6f7SStefano Zampini ierr = PetscBTSet(btee,i);CHKERRQ(ierr); 51262b0c6f7SStefano Zampini } 51362b0c6f7SStefano Zampini } 514637e8532SStefano Zampini ierr = PetscMalloc1(ne,&marks);CHKERRQ(ierr); 51562b0c6f7SStefano Zampini if (!conforming) { 51662b0c6f7SStefano Zampini ierr = MatTranspose(lGe,MAT_INITIAL_MATRIX,&lGt);CHKERRQ(ierr); 51762b0c6f7SStefano Zampini ierr = MatGetRowIJ(lGt,0,PETSC_FALSE,PETSC_FALSE,&i,&iit,&jjt,&done);CHKERRQ(ierr); 51862b0c6f7SStefano Zampini } 5194e64d54eSstefano_zampini ierr = MatGetRowIJ(lGe,0,PETSC_FALSE,PETSC_FALSE,&i,&ii,&jj,&done);CHKERRQ(ierr); 520dec27d64SStefano Zampini ierr = MatSeqAIJGetArray(lGe,&vals);CHKERRQ(ierr); 52162b0c6f7SStefano Zampini cum = 0; 522a13144ffSStefano Zampini for (i=0;i<ne;i++) { 523dec27d64SStefano Zampini /* eliminate rows corresponding to edge dofs belonging to coarse faces */ 52462b0c6f7SStefano Zampini if (!PetscBTLookup(btee,i)) { 525a13144ffSStefano Zampini marks[cum++] = i; 526dec27d64SStefano Zampini continue; 527dec27d64SStefano Zampini } 528dec27d64SStefano Zampini /* set badly connected edge dofs as primal */ 52962b0c6f7SStefano Zampini if (!conforming) { 53062b0c6f7SStefano Zampini if (ii[i+1]-ii[i] != order + 1) { /* every row of G on the coarse edge should list order+1 nodal dofs */ 531a13144ffSStefano Zampini marks[cum++] = i; 532a13144ffSStefano Zampini ierr = PetscBTSet(bte,i);CHKERRQ(ierr); 533a13144ffSStefano Zampini for (j=ii[i];j<ii[i+1];j++) { 534a13144ffSStefano Zampini ierr = PetscBTSet(btv,jj[j]);CHKERRQ(ierr); 535a13144ffSStefano Zampini } 53662b0c6f7SStefano Zampini } else { 
53762b0c6f7SStefano Zampini /* every edge dofs should be connected trough a certain number of nodal dofs 53862b0c6f7SStefano Zampini to other edge dofs belonging to coarse edges 53962b0c6f7SStefano Zampini - at most 2 endpoints 54062b0c6f7SStefano Zampini - order-1 interior nodal dofs 54162b0c6f7SStefano Zampini - no undefined nodal dofs (nconn < order) 54262b0c6f7SStefano Zampini */ 54362b0c6f7SStefano Zampini PetscInt ends = 0,ints = 0, undef = 0; 54462b0c6f7SStefano Zampini for (j=ii[i];j<ii[i+1];j++) { 54562b0c6f7SStefano Zampini PetscInt v = jj[j],k; 54662b0c6f7SStefano Zampini PetscInt nconn = iit[v+1]-iit[v]; 54762b0c6f7SStefano Zampini for (k=iit[v];k<iit[v+1];k++) if (!PetscBTLookup(btee,jjt[k])) nconn--; 54862b0c6f7SStefano Zampini if (nconn > order) ends++; 54962b0c6f7SStefano Zampini else if (nconn == order) ints++; 55062b0c6f7SStefano Zampini else undef++; 55162b0c6f7SStefano Zampini } 55262b0c6f7SStefano Zampini if (undef || ends > 2 || ints != order -1) { 55362b0c6f7SStefano Zampini marks[cum++] = i; 55462b0c6f7SStefano Zampini ierr = PetscBTSet(bte,i);CHKERRQ(ierr); 55562b0c6f7SStefano Zampini for (j=ii[i];j<ii[i+1];j++) { 55662b0c6f7SStefano Zampini ierr = PetscBTSet(btv,jj[j]);CHKERRQ(ierr); 55762b0c6f7SStefano Zampini } 55862b0c6f7SStefano Zampini } 55962b0c6f7SStefano Zampini } 560a13144ffSStefano Zampini } 561dec27d64SStefano Zampini /* We assume the order on the element edge is ii[i+1]-ii[i]-1 */ 562dec27d64SStefano Zampini if (!order && ii[i+1] != ii[i]) { 563dec27d64SStefano Zampini PetscScalar val = 1./(ii[i+1]-ii[i]-1); 564dec27d64SStefano Zampini for (j=ii[i];j<ii[i+1];j++) vals[j] = val; 565a13144ffSStefano Zampini } 566dec27d64SStefano Zampini } 56762b0c6f7SStefano Zampini ierr = PetscBTDestroy(&btee);CHKERRQ(ierr); 568dec27d64SStefano Zampini ierr = MatSeqAIJRestoreArray(lGe,&vals);CHKERRQ(ierr); 5694e64d54eSstefano_zampini ierr = MatRestoreRowIJ(lGe,0,PETSC_FALSE,PETSC_FALSE,&i,&ii,&jj,&done);CHKERRQ(ierr); 57062b0c6f7SStefano Zampini 
if (!conforming) { 57162b0c6f7SStefano Zampini ierr = MatRestoreRowIJ(lGt,0,PETSC_FALSE,PETSC_FALSE,&i,&iit,&jjt,&done);CHKERRQ(ierr); 57262b0c6f7SStefano Zampini ierr = MatDestroy(&lGt);CHKERRQ(ierr); 57362b0c6f7SStefano Zampini } 5744e64d54eSstefano_zampini ierr = MatZeroRows(lGe,cum,marks,0.,NULL,NULL);CHKERRQ(ierr); 575637e8532SStefano Zampini 576b03ebc13SStefano Zampini /* identify splitpoints and corner candidates */ 5774e64d54eSstefano_zampini ierr = MatTranspose(lGe,MAT_INITIAL_MATRIX,&lGt);CHKERRQ(ierr); 578a13144ffSStefano Zampini if (print) { 5794e64d54eSstefano_zampini ierr = PetscObjectSetName((PetscObject)lGe,"edgerestr_lG");CHKERRQ(ierr); 5804e64d54eSstefano_zampini ierr = MatView(lGe,NULL);CHKERRQ(ierr); 5814e64d54eSstefano_zampini ierr = PetscObjectSetName((PetscObject)lGt,"edgerestr_lGt");CHKERRQ(ierr); 582a13144ffSStefano Zampini ierr = MatView(lGt,NULL);CHKERRQ(ierr); 583a13144ffSStefano Zampini } 584a13144ffSStefano Zampini ierr = MatGetRowIJ(lGt,0,PETSC_FALSE,PETSC_FALSE,&i,&ii,&jj,&done);CHKERRQ(ierr); 585dec27d64SStefano Zampini ierr = MatSeqAIJGetArray(lGt,&vals);CHKERRQ(ierr); 586a13144ffSStefano Zampini for (i=0;i<nv;i++) { 587637e8532SStefano Zampini PetscInt ord = order, test = ii[i+1]-ii[i], vc = vcount[i]; 5887d871cd7SStefano Zampini PetscBool sneighs = PETSC_TRUE, bdir = PETSC_FALSE; 589b03ebc13SStefano Zampini if (!order) { /* variable order */ 590dec27d64SStefano Zampini PetscReal vorder = 0.; 591dec27d64SStefano Zampini 592dec27d64SStefano Zampini for (j=ii[i];j<ii[i+1];j++) vorder += PetscRealPart(vals[j]); 593dec27d64SStefano Zampini test = PetscFloorReal(vorder+10.*PETSC_SQRT_MACHINE_EPSILON); 594dec27d64SStefano Zampini if (vorder-test > PETSC_SQRT_MACHINE_EPSILON) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Unexpected value for vorder: %g (%d)",vorder,test); 595dec27d64SStefano Zampini ord = 1; 596dec27d64SStefano Zampini } 597a13144ffSStefano Zampini #if defined(PETSC_USE_DEBUG) 598dec27d64SStefano Zampini if (test%ord) 
SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Unexpected number of edge dofs %d connected with nodal dof %d with order %d",test,i,ord); 599a13144ffSStefano Zampini #endif 600637e8532SStefano Zampini for (j=ii[i];j<ii[i+1] && sneighs;j++) { 6017d871cd7SStefano Zampini if (PetscBTLookup(btbd,jj[j])) { 6027d871cd7SStefano Zampini bdir = PETSC_TRUE; 6037d871cd7SStefano Zampini break; 6047d871cd7SStefano Zampini } 605637e8532SStefano Zampini if (vc != ecount[jj[j]]) { 606637e8532SStefano Zampini sneighs = PETSC_FALSE; 607637e8532SStefano Zampini } else { 608637e8532SStefano Zampini PetscInt k,*vn = vneighs[i], *en = eneighs[jj[j]]; 609637e8532SStefano Zampini for (k=0;k<vc;k++) { 610637e8532SStefano Zampini if (vn[k] != en[k]) { 611637e8532SStefano Zampini sneighs = PETSC_FALSE; 612637e8532SStefano Zampini break; 613637e8532SStefano Zampini } 614637e8532SStefano Zampini } 615637e8532SStefano Zampini } 616637e8532SStefano Zampini } 6177d871cd7SStefano Zampini if (!sneighs || test >= 3*ord || bdir) { /* splitpoints */ 6187d871cd7SStefano Zampini if (print) PetscPrintf(PETSC_COMM_SELF,"SPLITPOINT %d (%d %d %d)\n",i,!sneighs,test >= 3*ord,bdir); 619a13144ffSStefano Zampini ierr = PetscBTSet(btv,i);CHKERRQ(ierr); 620dec27d64SStefano Zampini } else if (test == ord) { 621b03ebc13SStefano Zampini if (order == 1 || (!order && ii[i+1]-ii[i] == 1)) { 622a13144ffSStefano Zampini if (print) PetscPrintf(PETSC_COMM_SELF,"ENDPOINT %d\n",i); 623a13144ffSStefano Zampini ierr = PetscBTSet(btv,i);CHKERRQ(ierr); 624a13144ffSStefano Zampini } else { 625a13144ffSStefano Zampini if (print) PetscPrintf(PETSC_COMM_SELF,"CORNER CANDIDATE %d\n",i); 626a13144ffSStefano Zampini ierr = PetscBTSet(btvcand,i);CHKERRQ(ierr); 627a13144ffSStefano Zampini } 628a13144ffSStefano Zampini } 629a13144ffSStefano Zampini } 630637e8532SStefano Zampini ierr = PetscFree(ecount);CHKERRQ(ierr); 631637e8532SStefano Zampini ierr = PetscFree(vcount);CHKERRQ(ierr); 632637e8532SStefano Zampini if (ne) { 633637e8532SStefano 
Zampini ierr = PetscFree(eneighs[0]);CHKERRQ(ierr); 634637e8532SStefano Zampini } 635637e8532SStefano Zampini if (nv) { 636637e8532SStefano Zampini ierr = PetscFree(vneighs[0]);CHKERRQ(ierr); 637637e8532SStefano Zampini } 638637e8532SStefano Zampini ierr = PetscFree(eneighs);CHKERRQ(ierr); 639637e8532SStefano Zampini ierr = PetscFree(vneighs);CHKERRQ(ierr); 6407d871cd7SStefano Zampini ierr = PetscBTDestroy(&btbd);CHKERRQ(ierr); 641b03ebc13SStefano Zampini 642b03ebc13SStefano Zampini /* a candidate is valid if it is connected to another candidate via a non-primal edge dof */ 643b03ebc13SStefano Zampini if (order != 1) { 644b03ebc13SStefano Zampini if (print) PetscPrintf(PETSC_COMM_SELF,"INSPECTING CANDIDATES\n"); 645b03ebc13SStefano Zampini ierr = MatGetRowIJ(lGe,0,PETSC_FALSE,PETSC_FALSE,&i,&iit,&jjt,&done);CHKERRQ(ierr); 646b03ebc13SStefano Zampini for (i=0;i<nv;i++) { 647b03ebc13SStefano Zampini if (PetscBTLookup(btvcand,i)) { 648b03ebc13SStefano Zampini PetscBool found = PETSC_FALSE; 649b03ebc13SStefano Zampini for (j=ii[i];j<ii[i+1] && !found;j++) { 650b03ebc13SStefano Zampini PetscInt k,e = jj[j]; 651b03ebc13SStefano Zampini if (PetscBTLookup(bte,e)) continue; 652b03ebc13SStefano Zampini for (k=iit[e];k<iit[e+1];k++) { 653b03ebc13SStefano Zampini PetscInt v = jjt[k]; 654b03ebc13SStefano Zampini if (v != i && PetscBTLookup(btvcand,v)) { 655b03ebc13SStefano Zampini found = PETSC_TRUE; 656b03ebc13SStefano Zampini break; 657b03ebc13SStefano Zampini } 658b03ebc13SStefano Zampini } 659b03ebc13SStefano Zampini } 660b03ebc13SStefano Zampini if (!found) { 661b03ebc13SStefano Zampini if (print) PetscPrintf(PETSC_COMM_SELF," CANDIDATE %d CLEARED\n",i); 662b03ebc13SStefano Zampini ierr = PetscBTClear(btvcand,i);CHKERRQ(ierr); 663b03ebc13SStefano Zampini } else { 664b03ebc13SStefano Zampini if (print) PetscPrintf(PETSC_COMM_SELF," CANDIDATE %d ACCEPTED\n",i); 665b03ebc13SStefano Zampini } 666b03ebc13SStefano Zampini } 667b03ebc13SStefano Zampini } 668b03ebc13SStefano 
Zampini ierr = MatRestoreRowIJ(lGe,0,PETSC_FALSE,PETSC_FALSE,&i,&iit,&jjt,&done);CHKERRQ(ierr); 669b03ebc13SStefano Zampini } 670dec27d64SStefano Zampini ierr = MatSeqAIJRestoreArray(lGt,&vals);CHKERRQ(ierr); 671a13144ffSStefano Zampini ierr = MatRestoreRowIJ(lGt,0,PETSC_FALSE,PETSC_FALSE,&i,&ii,&jj,&done);CHKERRQ(ierr); 672b03ebc13SStefano Zampini ierr = MatDestroy(&lGe);CHKERRQ(ierr); 673a13144ffSStefano Zampini 674a13144ffSStefano Zampini /* Get the local G^T explicitly */ 6750569b399SStefano Zampini ierr = MatDestroy(&lGt);CHKERRQ(ierr); 676a13144ffSStefano Zampini ierr = MatTranspose(lG,MAT_INITIAL_MATRIX,&lGt);CHKERRQ(ierr); 6774e64d54eSstefano_zampini ierr = MatSetOption(lGt,MAT_KEEP_NONZERO_PATTERN,PETSC_FALSE);CHKERRQ(ierr); 678a13144ffSStefano Zampini 6794e64d54eSstefano_zampini /* Mark interior nodal dofs */ 680a13144ffSStefano Zampini ierr = ISLocalToGlobalMappingGetInfo(vl2g,&n_neigh,&neigh,&n_shared,&shared);CHKERRQ(ierr); 6814e64d54eSstefano_zampini ierr = PetscBTCreate(nv,&btvi);CHKERRQ(ierr); 682a13144ffSStefano Zampini for (i=1;i<n_neigh;i++) { 683a13144ffSStefano Zampini for (j=0;j<n_shared[i];j++) { 6844e64d54eSstefano_zampini ierr = PetscBTSet(btvi,shared[i][j]);CHKERRQ(ierr); 685a13144ffSStefano Zampini } 686a13144ffSStefano Zampini } 687a13144ffSStefano Zampini ierr = ISLocalToGlobalMappingRestoreInfo(vl2g,&n_neigh,&neigh,&n_shared,&shared);CHKERRQ(ierr); 688a13144ffSStefano Zampini 689a13144ffSStefano Zampini /* communicate corners and splitpoints */ 690a13144ffSStefano Zampini ierr = PetscMalloc1(nv,&vmarks);CHKERRQ(ierr); 691a13144ffSStefano Zampini ierr = PetscMemzero(sfvleaves,nv*sizeof(PetscInt));CHKERRQ(ierr); 692a13144ffSStefano Zampini ierr = PetscMemzero(sfvroots,Lv*sizeof(PetscInt));CHKERRQ(ierr); 693a13144ffSStefano Zampini for (i=0;i<nv;i++) if (PetscUnlikely(PetscBTLookup(btv,i))) sfvleaves[i] = 1; 694a13144ffSStefano Zampini 695a13144ffSStefano Zampini if (print) { 696a13144ffSStefano Zampini IS tbz; 697a13144ffSStefano Zampini 
698a13144ffSStefano Zampini cum = 0; 699a13144ffSStefano Zampini for (i=0;i<nv;i++) 700a13144ffSStefano Zampini if (sfvleaves[i]) 701a13144ffSStefano Zampini vmarks[cum++] = i; 702a13144ffSStefano Zampini 703a13144ffSStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,cum,vmarks,PETSC_COPY_VALUES,&tbz);CHKERRQ(ierr); 704a13144ffSStefano Zampini ierr = PetscObjectSetName((PetscObject)tbz,"corners_to_be_zeroed_local");CHKERRQ(ierr); 705a13144ffSStefano Zampini ierr = ISView(tbz,NULL);CHKERRQ(ierr); 706a13144ffSStefano Zampini ierr = ISDestroy(&tbz);CHKERRQ(ierr); 707a13144ffSStefano Zampini } 708a13144ffSStefano Zampini 709a13144ffSStefano Zampini ierr = PetscSFReduceBegin(sfv,MPIU_INT,sfvleaves,sfvroots,MPI_SUM);CHKERRQ(ierr); 710a13144ffSStefano Zampini ierr = PetscSFReduceEnd(sfv,MPIU_INT,sfvleaves,sfvroots,MPI_SUM);CHKERRQ(ierr); 711a13144ffSStefano Zampini ierr = PetscSFBcastBegin(sfv,MPIU_INT,sfvroots,sfvleaves);CHKERRQ(ierr); 712a13144ffSStefano Zampini ierr = PetscSFBcastEnd(sfv,MPIU_INT,sfvroots,sfvleaves);CHKERRQ(ierr); 713a13144ffSStefano Zampini 7144e64d54eSstefano_zampini /* Zero rows of lGt corresponding to identified corners 7154e64d54eSstefano_zampini and interior nodal dofs */ 716a13144ffSStefano Zampini cum = 0; 717a13144ffSStefano Zampini for (i=0;i<nv;i++) { 718a13144ffSStefano Zampini if (sfvleaves[i]) { 719a13144ffSStefano Zampini vmarks[cum++] = i; 720a13144ffSStefano Zampini ierr = PetscBTSet(btv,i);CHKERRQ(ierr); 721a13144ffSStefano Zampini } 7224e64d54eSstefano_zampini if (!PetscBTLookup(btvi,i)) vmarks[cum++] = i; 723a13144ffSStefano Zampini } 7244e64d54eSstefano_zampini ierr = PetscBTDestroy(&btvi);CHKERRQ(ierr); 725a13144ffSStefano Zampini if (print) { 726a13144ffSStefano Zampini IS tbz; 727a13144ffSStefano Zampini 728a13144ffSStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,cum,vmarks,PETSC_COPY_VALUES,&tbz);CHKERRQ(ierr); 7294e64d54eSstefano_zampini ierr = 
PetscObjectSetName((PetscObject)tbz,"corners_to_be_zeroed_with_interior");CHKERRQ(ierr); 730a13144ffSStefano Zampini ierr = ISView(tbz,NULL);CHKERRQ(ierr); 731a13144ffSStefano Zampini ierr = ISDestroy(&tbz);CHKERRQ(ierr); 732a13144ffSStefano Zampini } 733a13144ffSStefano Zampini ierr = MatZeroRows(lGt,cum,vmarks,0.,NULL,NULL);CHKERRQ(ierr); 734a13144ffSStefano Zampini ierr = PetscFree(vmarks);CHKERRQ(ierr); 735a13144ffSStefano Zampini ierr = PetscSFDestroy(&sfv);CHKERRQ(ierr); 736a13144ffSStefano Zampini ierr = PetscFree2(sfvleaves,sfvroots);CHKERRQ(ierr); 737a13144ffSStefano Zampini 738a13144ffSStefano Zampini /* Recompute G */ 739a13144ffSStefano Zampini ierr = MatDestroy(&lG);CHKERRQ(ierr); 740a13144ffSStefano Zampini ierr = MatTranspose(lGt,MAT_INITIAL_MATRIX,&lG);CHKERRQ(ierr); 741a13144ffSStefano Zampini if (print) { 742a13144ffSStefano Zampini ierr = PetscObjectSetName((PetscObject)lG,"used_lG");CHKERRQ(ierr); 743a13144ffSStefano Zampini ierr = MatView(lG,NULL);CHKERRQ(ierr); 744a13144ffSStefano Zampini ierr = PetscObjectSetName((PetscObject)lGt,"used_lGt");CHKERRQ(ierr); 745a13144ffSStefano Zampini ierr = MatView(lGt,NULL);CHKERRQ(ierr); 746a13144ffSStefano Zampini } 747a13144ffSStefano Zampini 748a13144ffSStefano Zampini /* Get primal dofs (if any) */ 749a13144ffSStefano Zampini cum = 0; 750a13144ffSStefano Zampini for (i=0;i<ne;i++) { 751a13144ffSStefano Zampini if (PetscUnlikely(PetscBTLookup(bte,i))) marks[cum++] = i; 752a13144ffSStefano Zampini } 753c2151214SStefano Zampini if (fl2g) { 754c2151214SStefano Zampini ierr = ISLocalToGlobalMappingApply(fl2g,cum,marks,marks);CHKERRQ(ierr); 755c2151214SStefano Zampini } 756a13144ffSStefano Zampini ierr = ISCreateGeneral(comm,cum,marks,PETSC_COPY_VALUES,&primals);CHKERRQ(ierr); 757a13144ffSStefano Zampini if (print) { 758a13144ffSStefano Zampini ierr = PetscObjectSetName((PetscObject)primals,"prescribed_primal_dofs");CHKERRQ(ierr); 759a13144ffSStefano Zampini ierr = ISView(primals,NULL);CHKERRQ(ierr); 
760a13144ffSStefano Zampini } 761a13144ffSStefano Zampini ierr = PetscBTDestroy(&bte);CHKERRQ(ierr); 762c2151214SStefano Zampini /* TODO: what if the user passed in some of them ? */ 763a13144ffSStefano Zampini ierr = PCBDDCSetPrimalVerticesLocalIS(pc,primals);CHKERRQ(ierr); 764a13144ffSStefano Zampini ierr = ISDestroy(&primals);CHKERRQ(ierr); 765a13144ffSStefano Zampini 766a13144ffSStefano Zampini /* Compute edge connectivity */ 767a13144ffSStefano Zampini ierr = PetscObjectSetOptionsPrefix((PetscObject)lG,"econn_");CHKERRQ(ierr); 768a13144ffSStefano Zampini ierr = MatMatMultSymbolic(lG,lGt,PETSC_DEFAULT,&conn);CHKERRQ(ierr); 769a13144ffSStefano Zampini ierr = MatGetRowIJ(conn,0,PETSC_FALSE,PETSC_FALSE,&i,&ii,&jj,&done);CHKERRQ(ierr); 770c2151214SStefano Zampini if (fl2g) { 771c2151214SStefano Zampini PetscBT btf; 772c2151214SStefano Zampini PetscInt *iia,*jja,*iiu,*jju; 773c2151214SStefano Zampini PetscBool rest = PETSC_FALSE,free = PETSC_FALSE; 774c2151214SStefano Zampini 775c2151214SStefano Zampini /* create CSR for all local dofs */ 776c2151214SStefano Zampini ierr = PetscMalloc1(n+1,&iia);CHKERRQ(ierr); 777c2151214SStefano Zampini if (pcbddc->mat_graph->nvtxs_csr) { /* the user has passed in a CSR graph */ 778c2151214SStefano Zampini if (pcbddc->mat_graph->nvtxs_csr != n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_USER,"Invalid size of CSR graph %d. 
Should be %d\n",pcbddc->mat_graph->nvtxs_csr,n); 779c2151214SStefano Zampini iiu = pcbddc->mat_graph->xadj; 780c2151214SStefano Zampini jju = pcbddc->mat_graph->adjncy; 781c2151214SStefano Zampini } else if (pcbddc->use_local_adj) { 782c2151214SStefano Zampini rest = PETSC_TRUE; 783c2151214SStefano Zampini ierr = MatGetRowIJ(matis->A,0,PETSC_TRUE,PETSC_FALSE,&i,(const PetscInt**)&iiu,(const PetscInt**)&jju,&done);CHKERRQ(ierr); 784c2151214SStefano Zampini } else { 785c2151214SStefano Zampini free = PETSC_TRUE; 786c2151214SStefano Zampini ierr = PetscMalloc2(n+1,&iiu,n,&jju);CHKERRQ(ierr); 787c2151214SStefano Zampini iiu[0] = 0; 788c2151214SStefano Zampini for (i=0;i<n;i++) { 789c2151214SStefano Zampini iiu[i+1] = i+1; 790c2151214SStefano Zampini jju[i] = -1; 791d904f53bSStefano Zampini } 792c2151214SStefano Zampini } 793c2151214SStefano Zampini 794c2151214SStefano Zampini /* import sizes of CSR */ 795c2151214SStefano Zampini iia[0] = 0; 796c2151214SStefano Zampini for (i=0;i<n;i++) iia[i+1] = iiu[i+1]-iiu[i]; 797c2151214SStefano Zampini 798c2151214SStefano Zampini /* overwrite entries corresponding to the Nedelec field */ 799c2151214SStefano Zampini ierr = PetscBTCreate(n,&btf);CHKERRQ(ierr); 800c2151214SStefano Zampini ierr = ISGetIndices(nedfieldlocal,&idxs);CHKERRQ(ierr); 801c2151214SStefano Zampini for (i=0;i<ne;i++) { 802c2151214SStefano Zampini ierr = PetscBTSet(btf,idxs[i]);CHKERRQ(ierr); 803c2151214SStefano Zampini iia[idxs[i]+1] = ii[i+1]-ii[i]; 804c2151214SStefano Zampini } 805c2151214SStefano Zampini 806c2151214SStefano Zampini /* iia in CSR */ 807c2151214SStefano Zampini for (i=0;i<n;i++) iia[i+1] += iia[i]; 808c2151214SStefano Zampini 809c2151214SStefano Zampini /* jja in CSR */ 810c2151214SStefano Zampini ierr = PetscMalloc1(iia[n],&jja);CHKERRQ(ierr); 811c2151214SStefano Zampini for (i=0;i<n;i++) 812c2151214SStefano Zampini if (!PetscBTLookup(btf,i)) 813c2151214SStefano Zampini for (j=0;j<iiu[i+1]-iiu[i];j++) 814c2151214SStefano Zampini jja[iia[i]+j] 
= jju[iiu[i]+j]; 815c2151214SStefano Zampini 816c2151214SStefano Zampini /* map edge dofs connectivity */ 8171e0482f5SStefano Zampini if (jj) { 818c2151214SStefano Zampini ierr = ISLocalToGlobalMappingApply(fl2g,ii[ne],jj,(PetscInt *)jj);CHKERRQ(ierr); 819c2151214SStefano Zampini for (i=0;i<ne;i++) { 820c2151214SStefano Zampini PetscInt e = idxs[i]; 821c2151214SStefano Zampini for (j=0;j<ii[i+1]-ii[i];j++) jja[iia[e]+j] = jj[ii[i]+j]; 822c2151214SStefano Zampini } 8231e0482f5SStefano Zampini } 824c2151214SStefano Zampini ierr = ISRestoreIndices(nedfieldlocal,&idxs);CHKERRQ(ierr); 825c2151214SStefano Zampini ierr = PCBDDCSetLocalAdjacencyGraph(pc,n,iia,jja,PETSC_OWN_POINTER);CHKERRQ(ierr); 826c2151214SStefano Zampini if (rest) { 827c2151214SStefano Zampini ierr = MatRestoreRowIJ(matis->A,0,PETSC_TRUE,PETSC_FALSE,&i,(const PetscInt**)&iiu,(const PetscInt**)&jju,&done);CHKERRQ(ierr); 828c2151214SStefano Zampini } 829c2151214SStefano Zampini if (free) { 830c2151214SStefano Zampini ierr = PetscFree2(iiu,jju);CHKERRQ(ierr); 831c2151214SStefano Zampini } 832c2151214SStefano Zampini ierr = PetscBTDestroy(&btf);CHKERRQ(ierr); 833c2151214SStefano Zampini } else { 834c2151214SStefano Zampini ierr = PCBDDCSetLocalAdjacencyGraph(pc,n,ii,jj,PETSC_USE_POINTER);CHKERRQ(ierr); 835c2151214SStefano Zampini } 836c2151214SStefano Zampini 837a13144ffSStefano Zampini /* Analyze interface for edge dofs */ 838a13144ffSStefano Zampini ierr = PCBDDCAnalyzeInterface(pc);CHKERRQ(ierr); 839213b8bfaSStefano Zampini pcbddc->mat_graph->twodim = PETSC_FALSE; 840a13144ffSStefano Zampini 841a13144ffSStefano Zampini /* Get coarse edges in the edge space */ 842c2151214SStefano Zampini ierr = PCBDDCGraphGetCandidatesIS(pcbddc->mat_graph,NULL,NULL,&nee,&alleedges,&allprimals);CHKERRQ(ierr); 843a13144ffSStefano Zampini ierr = MatRestoreRowIJ(conn,0,PETSC_FALSE,PETSC_FALSE,&i,&ii,&jj,&done);CHKERRQ(ierr); 844a13144ffSStefano Zampini 845c2151214SStefano Zampini if (fl2g) { 846c2151214SStefano Zampini ierr = 
ISGlobalToLocalMappingApplyIS(fl2g,IS_GTOLM_DROP,allprimals,&primals);CHKERRQ(ierr); 847c2151214SStefano Zampini ierr = PetscMalloc1(nee,&eedges);CHKERRQ(ierr); 848c2151214SStefano Zampini for (i=0;i<nee;i++) { 849c2151214SStefano Zampini ierr = ISGlobalToLocalMappingApplyIS(fl2g,IS_GTOLM_DROP,alleedges[i],&eedges[i]);CHKERRQ(ierr); 850c2151214SStefano Zampini } 851c2151214SStefano Zampini } else { 852c2151214SStefano Zampini eedges = alleedges; 853c2151214SStefano Zampini primals = allprimals; 854c2151214SStefano Zampini } 855c2151214SStefano Zampini 856a13144ffSStefano Zampini /* Mark fine edge dofs with their coarse edge id */ 857a13144ffSStefano Zampini ierr = PetscMemzero(marks,ne*sizeof(PetscInt));CHKERRQ(ierr); 858c2151214SStefano Zampini ierr = ISGetLocalSize(primals,&cum);CHKERRQ(ierr); 859c2151214SStefano Zampini ierr = ISGetIndices(primals,&idxs);CHKERRQ(ierr); 860c2151214SStefano Zampini for (i=0;i<cum;i++) marks[idxs[i]] = nee+1; 861c2151214SStefano Zampini ierr = ISRestoreIndices(primals,&idxs);CHKERRQ(ierr); 862c2151214SStefano Zampini if (print) { 863c2151214SStefano Zampini ierr = PetscObjectSetName((PetscObject)primals,"obtained_primal_dofs");CHKERRQ(ierr); 864c2151214SStefano Zampini ierr = ISView(primals,NULL);CHKERRQ(ierr); 865c2151214SStefano Zampini } 866c2151214SStefano Zampini 867c2151214SStefano Zampini maxsize = 0; 868a13144ffSStefano Zampini for (i=0;i<nee;i++) { 869a13144ffSStefano Zampini PetscInt size,mark = i+1; 870a13144ffSStefano Zampini 871a13144ffSStefano Zampini ierr = ISGetLocalSize(eedges[i],&size);CHKERRQ(ierr); 872a13144ffSStefano Zampini ierr = ISGetIndices(eedges[i],&idxs);CHKERRQ(ierr); 873a13144ffSStefano Zampini for (j=0;j<size;j++) marks[idxs[j]] = mark; 874a13144ffSStefano Zampini ierr = ISRestoreIndices(eedges[i],&idxs);CHKERRQ(ierr); 875a13144ffSStefano Zampini maxsize = PetscMax(maxsize,size); 876a13144ffSStefano Zampini } 877a13144ffSStefano Zampini 878a13144ffSStefano Zampini /* Find coarse edge endpoints */ 
879a13144ffSStefano Zampini ierr = MatGetRowIJ(lG,0,PETSC_FALSE,PETSC_FALSE,&i,&ii,&jj,&done);CHKERRQ(ierr); 880a13144ffSStefano Zampini ierr = MatGetRowIJ(lGt,0,PETSC_FALSE,PETSC_FALSE,&i,&iit,&jjt,&done);CHKERRQ(ierr); 881a13144ffSStefano Zampini for (i=0;i<nee;i++) { 882a13144ffSStefano Zampini PetscInt mark = i+1,size; 883a13144ffSStefano Zampini 884a13144ffSStefano Zampini ierr = ISGetLocalSize(eedges[i],&size);CHKERRQ(ierr); 8851e0482f5SStefano Zampini if (!size && nedfieldlocal) continue; 8861e0482f5SStefano Zampini if (!size) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Unexpected zero sized edge %d",i); 887a13144ffSStefano Zampini ierr = ISGetIndices(eedges[i],&idxs);CHKERRQ(ierr); 888a13144ffSStefano Zampini if (print) { 889a13144ffSStefano Zampini PetscPrintf(PETSC_COMM_SELF,"ENDPOINTS ANALYSIS EDGE %d\n",i); 890a13144ffSStefano Zampini ISView(eedges[i],NULL); 891a13144ffSStefano Zampini } 892a13144ffSStefano Zampini for (j=0;j<size;j++) { 893a13144ffSStefano Zampini PetscInt k, ee = idxs[j]; 894a13144ffSStefano Zampini if (print) PetscPrintf(PETSC_COMM_SELF," idx %d\n",ee); 895a13144ffSStefano Zampini for (k=ii[ee];k<ii[ee+1];k++) { 896a13144ffSStefano Zampini if (print) PetscPrintf(PETSC_COMM_SELF," inspect %d\n",jj[k]); 897a13144ffSStefano Zampini if (PetscBTLookup(btv,jj[k])) { 898a13144ffSStefano Zampini if (print) PetscPrintf(PETSC_COMM_SELF," corner found (already set) %d\n",jj[k]); 899a13144ffSStefano Zampini } else if (PetscBTLookup(btvcand,jj[k])) { /* is it ok? 
*/ 900a13144ffSStefano Zampini PetscInt k2; 901a13144ffSStefano Zampini PetscBool corner = PETSC_FALSE; 902a13144ffSStefano Zampini for (k2 = iit[jj[k]];k2 < iit[jj[k]+1];k2++) { 903c2151214SStefano Zampini if (print) PetscPrintf(PETSC_COMM_SELF," INSPECTING %d: mark %d (ref mark %d), boundary %d\n",jjt[k2],marks[jjt[k2]],mark,!!PetscBTLookup(btb,jjt[k2])); 904c2151214SStefano Zampini /* it's a corner if either is connected with an edge dof belonging to a different cc or 905c2151214SStefano Zampini if the edge dof lie on the natural part of the boundary */ 906c2151214SStefano Zampini if ((marks[jjt[k2]] && marks[jjt[k2]] != mark) || (!marks[jjt[k2]] && PetscBTLookup(btb,jjt[k2]))) { 907a13144ffSStefano Zampini corner = PETSC_TRUE; 908a13144ffSStefano Zampini break; 909a13144ffSStefano Zampini } 910a13144ffSStefano Zampini } 911a13144ffSStefano Zampini if (corner) { /* found the nodal dof corresponding to the endpoint of the edge */ 912a13144ffSStefano Zampini if (print) PetscPrintf(PETSC_COMM_SELF," corner found %d\n",jj[k]); 913a13144ffSStefano Zampini ierr = PetscBTSet(btv,jj[k]);CHKERRQ(ierr); 914a13144ffSStefano Zampini } else { 915a13144ffSStefano Zampini if (print) PetscPrintf(PETSC_COMM_SELF," no corners found\n"); 916a13144ffSStefano Zampini } 917a13144ffSStefano Zampini } 918a13144ffSStefano Zampini } 919a13144ffSStefano Zampini } 920a13144ffSStefano Zampini ierr = ISRestoreIndices(eedges[i],&idxs);CHKERRQ(ierr); 921a13144ffSStefano Zampini } 922a13144ffSStefano Zampini ierr = MatRestoreRowIJ(lGt,0,PETSC_FALSE,PETSC_FALSE,&i,&iit,&jjt,&done);CHKERRQ(ierr); 923a13144ffSStefano Zampini ierr = MatRestoreRowIJ(lG,0,PETSC_FALSE,PETSC_FALSE,&i,&ii,&jj,&done);CHKERRQ(ierr); 924c2151214SStefano Zampini ierr = PetscBTDestroy(&btb);CHKERRQ(ierr); 925a13144ffSStefano Zampini 926a13144ffSStefano Zampini /* Reset marked primal dofs */ 927a13144ffSStefano Zampini ierr = ISGetLocalSize(primals,&cum);CHKERRQ(ierr); 928a13144ffSStefano Zampini ierr = 
ISGetIndices(primals,&idxs);CHKERRQ(ierr); 929a13144ffSStefano Zampini for (i=0;i<cum;i++) marks[idxs[i]] = 0; 930a13144ffSStefano Zampini ierr = ISRestoreIndices(primals,&idxs);CHKERRQ(ierr); 931a13144ffSStefano Zampini 9320569b399SStefano Zampini /* Now use the initial lG */ 9330569b399SStefano Zampini ierr = MatDestroy(&lG);CHKERRQ(ierr); 9340569b399SStefano Zampini ierr = MatDestroy(&lGt);CHKERRQ(ierr); 9350569b399SStefano Zampini lG = lGinit; 9360569b399SStefano Zampini ierr = MatTranspose(lG,MAT_INITIAL_MATRIX,&lGt);CHKERRQ(ierr); 9370569b399SStefano Zampini 938a13144ffSStefano Zampini /* Compute extended cols indices */ 939b03ebc13SStefano Zampini ierr = PetscBTCreate(nv,&btvc);CHKERRQ(ierr); 940b03ebc13SStefano Zampini ierr = PetscBTCreate(nee,&bter);CHKERRQ(ierr); 941a13144ffSStefano Zampini ierr = MatGetRowIJ(lG,0,PETSC_FALSE,PETSC_FALSE,&i,&ii,&jj,&done);CHKERRQ(ierr); 942a13144ffSStefano Zampini ierr = MatSeqAIJGetMaxRowNonzeros(lG,&i);CHKERRQ(ierr); 943a13144ffSStefano Zampini i *= maxsize; 944b03ebc13SStefano Zampini ierr = PetscCalloc1(nee,&extcols);CHKERRQ(ierr); 945a13144ffSStefano Zampini ierr = PetscMalloc2(i,&extrow,i,&gidxs);CHKERRQ(ierr); 946a13144ffSStefano Zampini eerr = PETSC_FALSE; 947a13144ffSStefano Zampini for (i=0;i<nee;i++) { 948b03ebc13SStefano Zampini PetscInt size,found = 0; 949a13144ffSStefano Zampini 950a13144ffSStefano Zampini cum = 0; 951a13144ffSStefano Zampini ierr = ISGetLocalSize(eedges[i],&size);CHKERRQ(ierr); 9521e0482f5SStefano Zampini if (!size && nedfieldlocal) continue; 9531e0482f5SStefano Zampini if (!size) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Unexpected zero sized edge %d",i); 954a13144ffSStefano Zampini ierr = ISGetIndices(eedges[i],&idxs);CHKERRQ(ierr); 955b03ebc13SStefano Zampini ierr = PetscBTMemzero(nv,btvc);CHKERRQ(ierr); 956a13144ffSStefano Zampini for (j=0;j<size;j++) { 957a13144ffSStefano Zampini PetscInt k,ee = idxs[j]; 958b03ebc13SStefano Zampini for (k=ii[ee];k<ii[ee+1];k++) { 959b03ebc13SStefano 
Zampini PetscInt vv = jj[k]; 960b03ebc13SStefano Zampini if (!PetscBTLookup(btv,vv)) extrow[cum++] = vv; 961b03ebc13SStefano Zampini else if (!PetscBTLookupSet(btvc,vv)) found++; 962b03ebc13SStefano Zampini } 963a13144ffSStefano Zampini } 964a13144ffSStefano Zampini ierr = ISRestoreIndices(eedges[i],&idxs);CHKERRQ(ierr); 965a13144ffSStefano Zampini ierr = PetscSortRemoveDupsInt(&cum,extrow);CHKERRQ(ierr); 966a13144ffSStefano Zampini ierr = ISLocalToGlobalMappingApply(vl2g,cum,extrow,gidxs);CHKERRQ(ierr); 967a13144ffSStefano Zampini ierr = PetscSortIntWithArray(cum,gidxs,extrow);CHKERRQ(ierr); 968a13144ffSStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,cum,extrow,PETSC_COPY_VALUES,&extcols[i]);CHKERRQ(ierr); 969a13144ffSStefano Zampini /* it may happen that endpoints are not defined at this point 970a13144ffSStefano Zampini if it is the case, mark this edge for a second pass */ 971b03ebc13SStefano Zampini if (cum != size -1 || found != 2) { 972b03ebc13SStefano Zampini ierr = PetscBTSet(bter,i);CHKERRQ(ierr); 973a13144ffSStefano Zampini if (print) { 974a13144ffSStefano Zampini ierr = PetscObjectSetName((PetscObject)eedges[i],"error_edge");CHKERRQ(ierr); 975a13144ffSStefano Zampini ierr = ISView(eedges[i],NULL);CHKERRQ(ierr); 976a13144ffSStefano Zampini ierr = PetscObjectSetName((PetscObject)extcols[i],"error_extcol");CHKERRQ(ierr); 977a13144ffSStefano Zampini ierr = ISView(extcols[i],NULL);CHKERRQ(ierr); 978a13144ffSStefano Zampini } 979a13144ffSStefano Zampini eerr = PETSC_TRUE; 980a13144ffSStefano Zampini } 981a13144ffSStefano Zampini } 9824e64d54eSstefano_zampini /* if (eerr) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Unexpected SIZE OF EDGE > EXTCOL FIRST PASS"); */ 983a13144ffSStefano Zampini ierr = MPIU_Allreduce(&eerr,&done,1,MPIU_BOOL,MPI_LOR,comm);CHKERRQ(ierr); 984a13144ffSStefano Zampini if (done) { 985a13144ffSStefano Zampini PetscInt *newprimals; 986a13144ffSStefano Zampini 987a13144ffSStefano Zampini ierr = 
PetscMalloc1(ne,&newprimals);CHKERRQ(ierr); 988a13144ffSStefano Zampini ierr = ISGetLocalSize(primals,&cum);CHKERRQ(ierr); 989a13144ffSStefano Zampini ierr = ISGetIndices(primals,&idxs);CHKERRQ(ierr); 990a13144ffSStefano Zampini ierr = PetscMemcpy(newprimals,idxs,cum*sizeof(PetscInt));CHKERRQ(ierr); 991a13144ffSStefano Zampini ierr = ISRestoreIndices(primals,&idxs);CHKERRQ(ierr); 9920569b399SStefano Zampini ierr = MatGetRowIJ(lGt,0,PETSC_FALSE,PETSC_FALSE,&i,&iit,&jjt,&done);CHKERRQ(ierr); 993b03ebc13SStefano Zampini if (print) PetscPrintf(PETSC_COMM_SELF,"DOING SECOND PASS (eerr %d)\n",eerr); 994a13144ffSStefano Zampini for (i=0;i<nee;i++) { 995b03ebc13SStefano Zampini PetscBool has_candidates = PETSC_FALSE; 996b03ebc13SStefano Zampini if (PetscBTLookup(bter,i)) { 997a13144ffSStefano Zampini PetscInt size,mark = i+1; 998a13144ffSStefano Zampini 999a13144ffSStefano Zampini ierr = ISGetLocalSize(eedges[i],&size);CHKERRQ(ierr); 1000a13144ffSStefano Zampini ierr = ISGetIndices(eedges[i],&idxs);CHKERRQ(ierr); 1001c2151214SStefano Zampini /* for (j=0;j<size;j++) newprimals[cum++] = idxs[j]; */ 1002a13144ffSStefano Zampini for (j=0;j<size;j++) { 1003a13144ffSStefano Zampini PetscInt k,ee = idxs[j]; 1004b03ebc13SStefano Zampini if (print) PetscPrintf(PETSC_COMM_SELF,"Inspecting edge dof %d [%d %d)\n",ee,ii[ee],ii[ee+1]); 1005a13144ffSStefano Zampini for (k=ii[ee];k<ii[ee+1];k++) { 1006a13144ffSStefano Zampini /* set all candidates located on the edge as corners */ 1007a13144ffSStefano Zampini if (PetscBTLookup(btvcand,jj[k])) { 1008a13144ffSStefano Zampini PetscInt k2,vv = jj[k]; 1009b03ebc13SStefano Zampini has_candidates = PETSC_TRUE; 1010b03ebc13SStefano Zampini if (print) PetscPrintf(PETSC_COMM_SELF," Candidate set to vertex %d\n",vv); 1011a13144ffSStefano Zampini ierr = PetscBTSet(btv,vv);CHKERRQ(ierr); 1012a13144ffSStefano Zampini /* set all edge dofs connected to candidate as primals */ 1013a13144ffSStefano Zampini for (k2=iit[vv];k2<iit[vv+1];k2++) { 
1014a13144ffSStefano Zampini if (marks[jjt[k2]] == mark) { 1015a13144ffSStefano Zampini PetscInt k3,ee2 = jjt[k2]; 1016b03ebc13SStefano Zampini if (print) PetscPrintf(PETSC_COMM_SELF," Connected edge dof set to primal %d\n",ee2); 1017a13144ffSStefano Zampini newprimals[cum++] = ee2; 1018a13144ffSStefano Zampini /* finally set the new corners */ 1019a13144ffSStefano Zampini for (k3=ii[ee2];k3<ii[ee2+1];k3++) { 1020b03ebc13SStefano Zampini if (print) PetscPrintf(PETSC_COMM_SELF," Connected nodal dof set to vertex %d\n",jj[k3]); 1021a13144ffSStefano Zampini ierr = PetscBTSet(btv,jj[k3]);CHKERRQ(ierr); 1022a13144ffSStefano Zampini } 1023a13144ffSStefano Zampini } 1024a13144ffSStefano Zampini } 1025b03ebc13SStefano Zampini } else { 1026b03ebc13SStefano Zampini if (print) PetscPrintf(PETSC_COMM_SELF," Not a candidate vertex %d\n",jj[k]); 1027a13144ffSStefano Zampini } 1028a13144ffSStefano Zampini } 1029a13144ffSStefano Zampini } 1030b03ebc13SStefano Zampini if (!has_candidates) { /* circular edge */ 1031b03ebc13SStefano Zampini PetscInt k, ee = idxs[0],*tmarks; 1032b03ebc13SStefano Zampini 1033b03ebc13SStefano Zampini ierr = PetscCalloc1(ne,&tmarks);CHKERRQ(ierr); 1034b03ebc13SStefano Zampini if (print) PetscPrintf(PETSC_COMM_SELF," Circular edge %d\n",i); 1035b03ebc13SStefano Zampini for (k=ii[ee];k<ii[ee+1];k++) { 1036b03ebc13SStefano Zampini PetscInt k2; 1037b03ebc13SStefano Zampini if (print) PetscPrintf(PETSC_COMM_SELF," Set to corner %d\n",jj[k]); 1038b03ebc13SStefano Zampini ierr = PetscBTSet(btv,jj[k]);CHKERRQ(ierr); 1039b03ebc13SStefano Zampini for (k2=iit[jj[k]];k2<iit[jj[k]+1];k2++) tmarks[jjt[k2]]++; 1040b03ebc13SStefano Zampini } 1041b03ebc13SStefano Zampini for (j=0;j<size;j++) { 1042b03ebc13SStefano Zampini if (tmarks[idxs[j]] > 1) { 1043b03ebc13SStefano Zampini if (print) PetscPrintf(PETSC_COMM_SELF," Edge dof set to primal %d\n",idxs[j]); 1044b03ebc13SStefano Zampini newprimals[cum++] = idxs[j]; 1045b03ebc13SStefano Zampini } 1046b03ebc13SStefano Zampini 
} 1047b03ebc13SStefano Zampini ierr = PetscFree(tmarks);CHKERRQ(ierr); 1048b03ebc13SStefano Zampini } 1049a13144ffSStefano Zampini ierr = ISRestoreIndices(eedges[i],&idxs);CHKERRQ(ierr); 1050a13144ffSStefano Zampini } 1051a13144ffSStefano Zampini ierr = ISDestroy(&extcols[i]);CHKERRQ(ierr); 1052a13144ffSStefano Zampini } 1053b03ebc13SStefano Zampini ierr = PetscFree(extcols);CHKERRQ(ierr); 10540569b399SStefano Zampini ierr = MatRestoreRowIJ(lGt,0,PETSC_FALSE,PETSC_FALSE,&i,&iit,&jjt,&done);CHKERRQ(ierr); 1055a13144ffSStefano Zampini ierr = PetscSortRemoveDupsInt(&cum,newprimals);CHKERRQ(ierr); 1056c2151214SStefano Zampini if (fl2g) { 1057c2151214SStefano Zampini ierr = ISLocalToGlobalMappingApply(fl2g,cum,newprimals,newprimals);CHKERRQ(ierr); 1058c2151214SStefano Zampini ierr = ISDestroy(&primals);CHKERRQ(ierr); 1059c2151214SStefano Zampini for (i=0;i<nee;i++) { 1060c2151214SStefano Zampini ierr = ISDestroy(&eedges[i]);CHKERRQ(ierr); 1061c2151214SStefano Zampini } 1062c2151214SStefano Zampini ierr = PetscFree(eedges);CHKERRQ(ierr); 1063c2151214SStefano Zampini } 1064c2151214SStefano Zampini ierr = PCBDDCGraphRestoreCandidatesIS(pcbddc->mat_graph,NULL,NULL,&nee,&alleedges,&allprimals);CHKERRQ(ierr); 1065a13144ffSStefano Zampini ierr = ISCreateGeneral(comm,cum,newprimals,PETSC_COPY_VALUES,&primals);CHKERRQ(ierr); 1066a13144ffSStefano Zampini ierr = PetscFree(newprimals);CHKERRQ(ierr); 1067a13144ffSStefano Zampini ierr = PCBDDCSetPrimalVerticesLocalIS(pc,primals);CHKERRQ(ierr); 1068a13144ffSStefano Zampini ierr = ISDestroy(&primals);CHKERRQ(ierr); 1069a13144ffSStefano Zampini ierr = PCBDDCAnalyzeInterface(pc);CHKERRQ(ierr); 1070213b8bfaSStefano Zampini pcbddc->mat_graph->twodim = PETSC_FALSE; 1071c2151214SStefano Zampini ierr = PCBDDCGraphGetCandidatesIS(pcbddc->mat_graph,NULL,NULL,&nee,&alleedges,&allprimals);CHKERRQ(ierr); 1072c2151214SStefano Zampini if (fl2g) { 1073c2151214SStefano Zampini ierr = 
ISGlobalToLocalMappingApplyIS(fl2g,IS_GTOLM_DROP,allprimals,&primals);CHKERRQ(ierr); 1074c2151214SStefano Zampini ierr = PetscMalloc1(nee,&eedges);CHKERRQ(ierr); 1075c2151214SStefano Zampini for (i=0;i<nee;i++) { 1076c2151214SStefano Zampini ierr = ISGlobalToLocalMappingApplyIS(fl2g,IS_GTOLM_DROP,alleedges[i],&eedges[i]);CHKERRQ(ierr); 1077c2151214SStefano Zampini } 1078c2151214SStefano Zampini } else { 1079c2151214SStefano Zampini eedges = alleedges; 1080c2151214SStefano Zampini primals = allprimals; 1081c2151214SStefano Zampini } 1082b03ebc13SStefano Zampini ierr = PetscCalloc1(nee,&extcols);CHKERRQ(ierr); 1083a13144ffSStefano Zampini 1084a13144ffSStefano Zampini /* Mark again */ 1085a13144ffSStefano Zampini ierr = PetscMemzero(marks,ne*sizeof(PetscInt));CHKERRQ(ierr); 1086a13144ffSStefano Zampini for (i=0;i<nee;i++) { 1087a13144ffSStefano Zampini PetscInt size,mark = i+1; 1088a13144ffSStefano Zampini 1089a13144ffSStefano Zampini ierr = ISGetLocalSize(eedges[i],&size);CHKERRQ(ierr); 1090a13144ffSStefano Zampini ierr = ISGetIndices(eedges[i],&idxs);CHKERRQ(ierr); 1091a13144ffSStefano Zampini for (j=0;j<size;j++) marks[idxs[j]] = mark; 1092a13144ffSStefano Zampini ierr = ISRestoreIndices(eedges[i],&idxs);CHKERRQ(ierr); 1093a13144ffSStefano Zampini } 1094a13144ffSStefano Zampini if (print) { 1095a13144ffSStefano Zampini ierr = PetscObjectSetName((PetscObject)primals,"obtained_primal_dofs_secondpass");CHKERRQ(ierr); 1096a13144ffSStefano Zampini ierr = ISView(primals,NULL);CHKERRQ(ierr); 1097a13144ffSStefano Zampini } 1098a13144ffSStefano Zampini 1099a13144ffSStefano Zampini /* Recompute extended cols */ 1100a13144ffSStefano Zampini eerr = PETSC_FALSE; 1101a13144ffSStefano Zampini for (i=0;i<nee;i++) { 1102a13144ffSStefano Zampini PetscInt size; 1103a13144ffSStefano Zampini 1104a13144ffSStefano Zampini cum = 0; 1105a13144ffSStefano Zampini ierr = ISGetLocalSize(eedges[i],&size);CHKERRQ(ierr); 11061e0482f5SStefano Zampini if (!size && nedfieldlocal) continue; 
11071e0482f5SStefano Zampini if (!size) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Unexpected zero sized edge %d",i); 1108a13144ffSStefano Zampini ierr = ISGetIndices(eedges[i],&idxs);CHKERRQ(ierr); 1109a13144ffSStefano Zampini for (j=0;j<size;j++) { 1110a13144ffSStefano Zampini PetscInt k,ee = idxs[j]; 11111e0482f5SStefano Zampini for (k=ii[ee];k<ii[ee+1];k++) if (!PetscBTLookup(btv,jj[k])) extrow[cum++] = jj[k]; 1112a13144ffSStefano Zampini } 1113a13144ffSStefano Zampini ierr = ISRestoreIndices(eedges[i],&idxs);CHKERRQ(ierr); 1114a13144ffSStefano Zampini ierr = PetscSortRemoveDupsInt(&cum,extrow);CHKERRQ(ierr); 1115a13144ffSStefano Zampini ierr = ISLocalToGlobalMappingApply(vl2g,cum,extrow,gidxs);CHKERRQ(ierr); 1116a13144ffSStefano Zampini ierr = PetscSortIntWithArray(cum,gidxs,extrow);CHKERRQ(ierr); 1117a13144ffSStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,cum,extrow,PETSC_COPY_VALUES,&extcols[i]);CHKERRQ(ierr); 1118a13144ffSStefano Zampini if (cum != size -1) { 1119a13144ffSStefano Zampini if (print) { 1120a13144ffSStefano Zampini ierr = PetscObjectSetName((PetscObject)eedges[i],"error_edge_secondpass");CHKERRQ(ierr); 1121a13144ffSStefano Zampini ierr = ISView(eedges[i],NULL);CHKERRQ(ierr); 1122a13144ffSStefano Zampini ierr = PetscObjectSetName((PetscObject)extcols[i],"error_extcol_secondpass");CHKERRQ(ierr); 1123a13144ffSStefano Zampini ierr = ISView(extcols[i],NULL);CHKERRQ(ierr); 1124a13144ffSStefano Zampini } 1125a13144ffSStefano Zampini eerr = PETSC_TRUE; 1126a13144ffSStefano Zampini } 1127a13144ffSStefano Zampini } 1128a13144ffSStefano Zampini } 1129a13144ffSStefano Zampini ierr = MatRestoreRowIJ(lG,0,PETSC_FALSE,PETSC_FALSE,&i,&ii,&jj,&done);CHKERRQ(ierr); 1130a13144ffSStefano Zampini ierr = PetscFree2(extrow,gidxs);CHKERRQ(ierr); 1131b03ebc13SStefano Zampini ierr = PetscBTDestroy(&bter);CHKERRQ(ierr); 11327d871cd7SStefano Zampini if (print) { ierr = PCBDDCGraphASCIIView(pcbddc->mat_graph,5,PETSC_VIEWER_STDOUT_SELF);CHKERRQ(ierr); } 
1133a13144ffSStefano Zampini /* an error should not occur at this point */ 1134a13144ffSStefano Zampini if (eerr) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Unexpected SIZE OF EDGE > EXTCOL SECOND PASS"); 1135a13144ffSStefano Zampini 11364e64d54eSstefano_zampini /* Check the number of endpoints */ 11370569b399SStefano Zampini ierr = MatGetRowIJ(lG,0,PETSC_FALSE,PETSC_FALSE,&i,&ii,&jj,&done);CHKERRQ(ierr); 1138b03ebc13SStefano Zampini ierr = PetscMalloc1(2*nee,&corners);CHKERRQ(ierr); 1139b03ebc13SStefano Zampini ierr = PetscMalloc1(nee,&cedges);CHKERRQ(ierr); 11404e64d54eSstefano_zampini for (i=0;i<nee;i++) { 1141b03ebc13SStefano Zampini PetscInt size, found = 0, gc[2]; 11424e64d54eSstefano_zampini 1143b03ebc13SStefano Zampini /* init with defaults */ 1144b03ebc13SStefano Zampini cedges[i] = corners[i*2] = corners[i*2+1] = -1; 11454e64d54eSstefano_zampini ierr = ISGetLocalSize(eedges[i],&size);CHKERRQ(ierr); 11461e0482f5SStefano Zampini if (!size && nedfieldlocal) continue; 11471e0482f5SStefano Zampini if (!size) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Unexpected zero sized edge %d",i); 11484e64d54eSstefano_zampini ierr = ISGetIndices(eedges[i],&idxs);CHKERRQ(ierr); 1149b03ebc13SStefano Zampini ierr = PetscBTMemzero(nv,btvc);CHKERRQ(ierr); 11504e64d54eSstefano_zampini for (j=0;j<size;j++) { 11514e64d54eSstefano_zampini PetscInt k,ee = idxs[j]; 11524e64d54eSstefano_zampini for (k=ii[ee];k<ii[ee+1];k++) { 11534e64d54eSstefano_zampini PetscInt vv = jj[k]; 11544e64d54eSstefano_zampini if (PetscBTLookup(btv,vv) && !PetscBTLookupSet(btvc,vv)) { 1155b03ebc13SStefano Zampini if (found == 2) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Found more then two corners for edge %d\n",i); 1156b03ebc13SStefano Zampini corners[i*2+found++] = vv; 11574e64d54eSstefano_zampini } 11584e64d54eSstefano_zampini } 11594e64d54eSstefano_zampini } 1160b03ebc13SStefano Zampini if (found != 2) { 1161b03ebc13SStefano Zampini PetscInt e; 1162b03ebc13SStefano Zampini if (fl2g) { 1163b03ebc13SStefano 
Zampini ierr = ISLocalToGlobalMappingApply(fl2g,1,idxs,&e);CHKERRQ(ierr); 1164b03ebc13SStefano Zampini } else { 1165b03ebc13SStefano Zampini e = idxs[0]; 1166b03ebc13SStefano Zampini } 1167b03ebc13SStefano Zampini SETERRQ4(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Found %d corners for edge %d (astart %d, estart %d)\n",found,i,e,idxs[0]); 1168b03ebc13SStefano Zampini } 1169eee23b56SStefano Zampini 1170eee23b56SStefano Zampini /* get primal dof index on this coarse edge */ 1171b03ebc13SStefano Zampini ierr = ISLocalToGlobalMappingApply(vl2g,2,corners+2*i,gc);CHKERRQ(ierr); 1172b03ebc13SStefano Zampini if (gc[0] > gc[1]) { 1173b03ebc13SStefano Zampini PetscInt swap = corners[2*i]; 1174b03ebc13SStefano Zampini corners[2*i] = corners[2*i+1]; 1175b03ebc13SStefano Zampini corners[2*i+1] = swap; 1176b03ebc13SStefano Zampini } 1177eee23b56SStefano Zampini cedges[i] = idxs[size-1]; 11784e64d54eSstefano_zampini ierr = ISRestoreIndices(eedges[i],&idxs);CHKERRQ(ierr); 1179b03ebc13SStefano Zampini if (print) PetscPrintf(PETSC_COMM_SELF,"EDGE %d: ce %d, corners (%d,%d)\n",i,cedges[i],corners[2*i],corners[2*i+1]); 11804e64d54eSstefano_zampini } 11810569b399SStefano Zampini ierr = MatRestoreRowIJ(lG,0,PETSC_FALSE,PETSC_FALSE,&i,&ii,&jj,&done);CHKERRQ(ierr); 11824e64d54eSstefano_zampini ierr = PetscBTDestroy(&btvc);CHKERRQ(ierr); 11834e64d54eSstefano_zampini 1184a13144ffSStefano Zampini #if defined(PETSC_USE_DEBUG) 1185a13144ffSStefano Zampini /* Inspects columns of lG (rows of lGt) and make sure the change of basis will 1186a13144ffSStefano Zampini not interfere with neighbouring coarse edges */ 1187a13144ffSStefano Zampini ierr = PetscMalloc1(nee+1,&emarks);CHKERRQ(ierr); 1188a13144ffSStefano Zampini ierr = MatGetRowIJ(lGt,0,PETSC_FALSE,PETSC_FALSE,&i,&ii,&jj,&done);CHKERRQ(ierr); 1189a13144ffSStefano Zampini for (i=0;i<nv;i++) { 1190a13144ffSStefano Zampini PetscInt emax = 0,eemax = 0; 1191a13144ffSStefano Zampini 1192a13144ffSStefano Zampini if (ii[i+1]==ii[i] || PetscBTLookup(btv,i)) 
continue; 1193a13144ffSStefano Zampini ierr = PetscMemzero(emarks,(nee+1)*sizeof(PetscInt));CHKERRQ(ierr); 1194a13144ffSStefano Zampini for (j=ii[i];j<ii[i+1];j++) emarks[marks[jj[j]]]++; 1195a13144ffSStefano Zampini for (j=1;j<nee+1;j++) { 1196a13144ffSStefano Zampini if (emax < emarks[j]) { 1197a13144ffSStefano Zampini emax = emarks[j]; 1198a13144ffSStefano Zampini eemax = j; 1199a13144ffSStefano Zampini } 1200a13144ffSStefano Zampini } 1201a13144ffSStefano Zampini /* not relevant for edges */ 1202a13144ffSStefano Zampini if (!eemax) continue; 1203a13144ffSStefano Zampini 1204a13144ffSStefano Zampini for (j=ii[i];j<ii[i+1];j++) { 1205a13144ffSStefano Zampini if (marks[jj[j]] && marks[jj[j]] != eemax) { 1206c2151214SStefano Zampini SETERRQ4(PETSC_COMM_SELF,PETSC_ERR_SUP,"Found 2 coarse edges (id %d and %d) connected through the %d nodal dof at edge dof %d\n",marks[jj[j]]-1,eemax,i,jj[j]); 1207a13144ffSStefano Zampini } 1208a13144ffSStefano Zampini } 1209a13144ffSStefano Zampini } 1210a13144ffSStefano Zampini ierr = PetscFree(emarks);CHKERRQ(ierr); 1211a13144ffSStefano Zampini ierr = MatRestoreRowIJ(lGt,0,PETSC_FALSE,PETSC_FALSE,&i,&ii,&jj,&done);CHKERRQ(ierr); 1212a13144ffSStefano Zampini #endif 1213a13144ffSStefano Zampini 1214a13144ffSStefano Zampini /* Compute extended rows indices for edge blocks of the change of basis */ 1215a13144ffSStefano Zampini ierr = MatGetRowIJ(lGt,0,PETSC_FALSE,PETSC_FALSE,&i,&ii,&jj,&done);CHKERRQ(ierr); 1216a13144ffSStefano Zampini ierr = MatSeqAIJGetMaxRowNonzeros(lGt,&extmem);CHKERRQ(ierr); 1217a13144ffSStefano Zampini extmem *= maxsize; 1218a13144ffSStefano Zampini ierr = PetscMalloc1(extmem*nee,&extrow);CHKERRQ(ierr); 1219a13144ffSStefano Zampini ierr = PetscMalloc1(nee,&extrows);CHKERRQ(ierr); 1220a13144ffSStefano Zampini ierr = PetscCalloc1(nee,&extrowcum);CHKERRQ(ierr); 1221a13144ffSStefano Zampini for (i=0;i<nv;i++) { 1222a13144ffSStefano Zampini PetscInt mark = 0,size,start; 1223213b8bfaSStefano Zampini 1224a13144ffSStefano 
Zampini if (ii[i+1]==ii[i] || PetscBTLookup(btv,i)) continue; 1225a13144ffSStefano Zampini for (j=ii[i];j<ii[i+1];j++) 1226a13144ffSStefano Zampini if (marks[jj[j]] && !mark) 1227a13144ffSStefano Zampini mark = marks[jj[j]]; 1228a13144ffSStefano Zampini 1229a13144ffSStefano Zampini /* not relevant */ 1230a13144ffSStefano Zampini if (!mark) continue; 1231a13144ffSStefano Zampini 1232a13144ffSStefano Zampini /* import extended row */ 1233a13144ffSStefano Zampini mark--; 1234a13144ffSStefano Zampini start = mark*extmem+extrowcum[mark]; 1235a13144ffSStefano Zampini size = ii[i+1]-ii[i]; 1236a13144ffSStefano Zampini if (extrowcum[mark] + size > extmem) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Not enough memory allocated %d > %d",extrowcum[mark] + size,extmem); 1237a13144ffSStefano Zampini ierr = PetscMemcpy(extrow+start,jj+ii[i],size*sizeof(PetscInt));CHKERRQ(ierr); 1238a13144ffSStefano Zampini extrowcum[mark] += size; 1239a13144ffSStefano Zampini } 1240a13144ffSStefano Zampini ierr = MatRestoreRowIJ(lGt,0,PETSC_FALSE,PETSC_FALSE,&i,&ii,&jj,&done);CHKERRQ(ierr); 1241213b8bfaSStefano Zampini ierr = MatDestroy(&lGt);CHKERRQ(ierr); 1242213b8bfaSStefano Zampini ierr = PetscFree(marks);CHKERRQ(ierr); 1243213b8bfaSStefano Zampini 1244213b8bfaSStefano Zampini /* Compress extrows */ 1245a13144ffSStefano Zampini cum = 0; 1246a13144ffSStefano Zampini for (i=0;i<nee;i++) { 1247a13144ffSStefano Zampini PetscInt size = extrowcum[i],*start = extrow + i*extmem; 1248a13144ffSStefano Zampini ierr = PetscSortRemoveDupsInt(&size,start);CHKERRQ(ierr); 1249a13144ffSStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,size,start,PETSC_USE_POINTER,&extrows[i]);CHKERRQ(ierr); 1250a13144ffSStefano Zampini cum = PetscMax(cum,size); 1251a13144ffSStefano Zampini } 1252a13144ffSStefano Zampini ierr = PetscFree(extrowcum);CHKERRQ(ierr); 1253a13144ffSStefano Zampini ierr = PetscBTDestroy(&btv);CHKERRQ(ierr); 1254a13144ffSStefano Zampini ierr = PetscBTDestroy(&btvcand);CHKERRQ(ierr); 
1255a13144ffSStefano Zampini 1256a13144ffSStefano Zampini /* Workspace for lapack inner calls and VecSetValues */ 1257a13144ffSStefano Zampini ierr = PetscMalloc2((5+cum+maxsize)*maxsize,&work,maxsize,&rwork);CHKERRQ(ierr); 1258a13144ffSStefano Zampini 1259a13144ffSStefano Zampini /* Create change of basis matrix (preallocation can be improved) */ 1260a13144ffSStefano Zampini ierr = MatCreate(comm,&T);CHKERRQ(ierr); 1261c2151214SStefano Zampini ierr = MatSetSizes(T,pc->pmat->rmap->n,pc->pmat->rmap->n, 1262c2151214SStefano Zampini pc->pmat->rmap->N,pc->pmat->rmap->N);CHKERRQ(ierr); 1263a13144ffSStefano Zampini ierr = MatSetType(T,MATAIJ);CHKERRQ(ierr); 1264a13144ffSStefano Zampini ierr = MatSeqAIJSetPreallocation(T,10,NULL);CHKERRQ(ierr); 1265a13144ffSStefano Zampini ierr = MatMPIAIJSetPreallocation(T,10,NULL,10,NULL);CHKERRQ(ierr); 12661e0482f5SStefano Zampini ierr = MatSetLocalToGlobalMapping(T,al2g,al2g);CHKERRQ(ierr); 1267a13144ffSStefano Zampini ierr = MatSetOption(T,MAT_NEW_NONZERO_ALLOCATION_ERR,PETSC_FALSE);CHKERRQ(ierr); 1268a13144ffSStefano Zampini ierr = MatSetOption(T,MAT_ROW_ORIENTED,PETSC_FALSE);CHKERRQ(ierr); 1269213b8bfaSStefano Zampini ierr = ISLocalToGlobalMappingDestroy(&al2g);CHKERRQ(ierr); 1270a13144ffSStefano Zampini 1271a13144ffSStefano Zampini /* Defaults to identity */ 1272c2151214SStefano Zampini ierr = MatCreateVecs(pc->pmat,&tvec,NULL);CHKERRQ(ierr); 1273a13144ffSStefano Zampini ierr = VecSet(tvec,1.0);CHKERRQ(ierr); 1274a13144ffSStefano Zampini ierr = MatDiagonalSet(T,tvec,INSERT_VALUES);CHKERRQ(ierr); 1275a13144ffSStefano Zampini ierr = VecDestroy(&tvec);CHKERRQ(ierr); 1276a13144ffSStefano Zampini 12771e0482f5SStefano Zampini /* Create discrete gradient for the coarser level if needed */ 12781e0482f5SStefano Zampini ierr = MatDestroy(&pcbddc->nedcG);CHKERRQ(ierr); 12791e0482f5SStefano Zampini ierr = ISDestroy(&pcbddc->nedclocal);CHKERRQ(ierr); 12801e0482f5SStefano Zampini if (pcbddc->current_level < pcbddc->max_levels) { 
12811e0482f5SStefano Zampini ISLocalToGlobalMapping cel2g,cvl2g; 12821e0482f5SStefano Zampini IS wis,gwis; 12831e0482f5SStefano Zampini PetscInt cnv,cne; 12841e0482f5SStefano Zampini 12851e0482f5SStefano Zampini ierr = ISCreateGeneral(comm,nee,cedges,PETSC_COPY_VALUES,&wis);CHKERRQ(ierr); 12861e0482f5SStefano Zampini if (fl2g) { 12871e0482f5SStefano Zampini ierr = ISLocalToGlobalMappingApplyIS(fl2g,wis,&pcbddc->nedclocal);CHKERRQ(ierr); 12881e0482f5SStefano Zampini } else { 12891e0482f5SStefano Zampini ierr = PetscObjectReference((PetscObject)wis);CHKERRQ(ierr); 12901e0482f5SStefano Zampini pcbddc->nedclocal = wis; 12911e0482f5SStefano Zampini } 12921e0482f5SStefano Zampini ierr = ISLocalToGlobalMappingApplyIS(el2g,wis,&gwis);CHKERRQ(ierr); 12931e0482f5SStefano Zampini ierr = ISDestroy(&wis);CHKERRQ(ierr); 12941e0482f5SStefano Zampini ierr = ISRenumber(gwis,NULL,&cne,&wis);CHKERRQ(ierr); 12951e0482f5SStefano Zampini ierr = ISLocalToGlobalMappingCreateIS(wis,&cel2g);CHKERRQ(ierr); 12961e0482f5SStefano Zampini ierr = ISDestroy(&wis);CHKERRQ(ierr); 12971e0482f5SStefano Zampini ierr = ISDestroy(&gwis);CHKERRQ(ierr); 12981e0482f5SStefano Zampini 12991e0482f5SStefano Zampini ierr = ISCreateGeneral(comm,2*nee,corners,PETSC_USE_POINTER,&wis);CHKERRQ(ierr); 13001e0482f5SStefano Zampini ierr = ISLocalToGlobalMappingApplyIS(vl2g,wis,&gwis);CHKERRQ(ierr); 13011e0482f5SStefano Zampini ierr = ISDestroy(&wis);CHKERRQ(ierr); 13021e0482f5SStefano Zampini ierr = ISRenumber(gwis,NULL,&cnv,&wis);CHKERRQ(ierr); 13031e0482f5SStefano Zampini ierr = ISLocalToGlobalMappingCreateIS(wis,&cvl2g);CHKERRQ(ierr); 13041e0482f5SStefano Zampini ierr = ISDestroy(&wis);CHKERRQ(ierr); 13051e0482f5SStefano Zampini ierr = ISDestroy(&gwis);CHKERRQ(ierr); 13061e0482f5SStefano Zampini 13071e0482f5SStefano Zampini ierr = MatCreate(comm,&pcbddc->nedcG);CHKERRQ(ierr); 13081e0482f5SStefano Zampini ierr = MatSetSizes(pcbddc->nedcG,PETSC_DECIDE,PETSC_DECIDE,cne,cnv);CHKERRQ(ierr); 13091e0482f5SStefano Zampini 
ierr = MatSetType(pcbddc->nedcG,MATAIJ);CHKERRQ(ierr); 13101e0482f5SStefano Zampini ierr = MatSeqAIJSetPreallocation(pcbddc->nedcG,2,NULL);CHKERRQ(ierr); 13111e0482f5SStefano Zampini ierr = MatMPIAIJSetPreallocation(pcbddc->nedcG,2,NULL,2,NULL);CHKERRQ(ierr); 13121e0482f5SStefano Zampini ierr = MatSetLocalToGlobalMapping(pcbddc->nedcG,cel2g,cvl2g);CHKERRQ(ierr); 13131e0482f5SStefano Zampini ierr = ISLocalToGlobalMappingDestroy(&cel2g);CHKERRQ(ierr); 13141e0482f5SStefano Zampini ierr = ISLocalToGlobalMappingDestroy(&cvl2g);CHKERRQ(ierr); 13151e0482f5SStefano Zampini } 1316213b8bfaSStefano Zampini ierr = ISLocalToGlobalMappingDestroy(&vl2g);CHKERRQ(ierr); 13171e0482f5SStefano Zampini 13181e0482f5SStefano Zampini #if defined(PRINT_GDET) 13191e0482f5SStefano Zampini inc = 0; 13201e0482f5SStefano Zampini lev = pcbddc->current_level; 13211e0482f5SStefano Zampini #endif 1322213b8bfaSStefano Zampini 1323213b8bfaSStefano Zampini /* Insert values in the change of basis matrix */ 1324a13144ffSStefano Zampini for (i=0;i<nee;i++) { 1325a13144ffSStefano Zampini Mat Gins = NULL, GKins = NULL; 13261e0482f5SStefano Zampini IS cornersis = NULL; 13271e0482f5SStefano Zampini PetscScalar cvals[2]; 1328a13144ffSStefano Zampini 13291e0482f5SStefano Zampini if (pcbddc->nedcG) { 13301e0482f5SStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,2,corners+2*i,PETSC_USE_POINTER,&cornersis);CHKERRQ(ierr); 13311e0482f5SStefano Zampini } 13321e0482f5SStefano Zampini ierr = PCBDDCComputeNedelecChangeEdge(lG,eedges[i],extrows[i],extcols[i],cornersis,&Gins,&GKins,cvals,work,rwork);CHKERRQ(ierr); 1333a13144ffSStefano Zampini if (Gins && GKins) { 1334a13144ffSStefano Zampini PetscScalar *data; 1335a13144ffSStefano Zampini const PetscInt *rows,*cols; 1336a13144ffSStefano Zampini PetscInt nrh,nch,nrc,ncc; 1337a13144ffSStefano Zampini 1338a13144ffSStefano Zampini ierr = ISGetIndices(eedges[i],&cols);CHKERRQ(ierr); 1339a13144ffSStefano Zampini /* H1 */ 1340a13144ffSStefano Zampini ierr = 
ISGetIndices(extrows[i],&rows);CHKERRQ(ierr); 1341a13144ffSStefano Zampini ierr = MatGetSize(Gins,&nrh,&nch);CHKERRQ(ierr); 1342a13144ffSStefano Zampini ierr = MatDenseGetArray(Gins,&data);CHKERRQ(ierr); 1343a13144ffSStefano Zampini ierr = MatSetValuesLocal(T,nrh,rows,nch,cols,data,INSERT_VALUES);CHKERRQ(ierr); 1344a13144ffSStefano Zampini ierr = MatDenseRestoreArray(Gins,&data);CHKERRQ(ierr); 1345a13144ffSStefano Zampini ierr = ISRestoreIndices(extrows[i],&rows);CHKERRQ(ierr); 1346a13144ffSStefano Zampini /* complement */ 1347a13144ffSStefano Zampini ierr = MatGetSize(GKins,&nrc,&ncc);CHKERRQ(ierr); 13481e0482f5SStefano Zampini if (!ncc) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Constant function has not been generated for coarse edge %d",i); 1349213b8bfaSStefano Zampini if (ncc + nch != nrc) SETERRQ4(PETSC_COMM_SELF,PETSC_ERR_PLIB,"The sum of the number of columns of GKins %d and Gins %d does not match %d for coarse edge %d",ncc,nch,nrc,i); 1350213b8bfaSStefano Zampini if (ncc != 1 && pcbddc->nedcG) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_SUP,"Cannot generate the coarse discrete gradient for coarse edge %d with ncc %d",i,ncc); 1351a13144ffSStefano Zampini ierr = MatDenseGetArray(GKins,&data);CHKERRQ(ierr); 1352a13144ffSStefano Zampini ierr = MatSetValuesLocal(T,nrc,cols,ncc,cols+nch,data,INSERT_VALUES);CHKERRQ(ierr); 1353a13144ffSStefano Zampini ierr = MatDenseRestoreArray(GKins,&data);CHKERRQ(ierr); 13541e0482f5SStefano Zampini 13551e0482f5SStefano Zampini /* coarse discrete gradient */ 13561e0482f5SStefano Zampini if (pcbddc->nedcG) { 13571e0482f5SStefano Zampini PetscInt cols[2]; 13581e0482f5SStefano Zampini 13591e0482f5SStefano Zampini cols[0] = 2*i; 13601e0482f5SStefano Zampini cols[1] = 2*i+1; 13611e0482f5SStefano Zampini ierr = MatSetValuesLocal(pcbddc->nedcG,1,&i,2,cols,cvals,INSERT_VALUES);CHKERRQ(ierr); 13621e0482f5SStefano Zampini } 1363a13144ffSStefano Zampini ierr = ISRestoreIndices(eedges[i],&cols);CHKERRQ(ierr); 1364a13144ffSStefano Zampini } 
1365a13144ffSStefano Zampini ierr = ISDestroy(&extrows[i]);CHKERRQ(ierr); 1366a13144ffSStefano Zampini ierr = ISDestroy(&extcols[i]);CHKERRQ(ierr); 13671e0482f5SStefano Zampini ierr = ISDestroy(&cornersis);CHKERRQ(ierr); 1368a13144ffSStefano Zampini ierr = MatDestroy(&Gins);CHKERRQ(ierr); 1369a13144ffSStefano Zampini ierr = MatDestroy(&GKins);CHKERRQ(ierr); 1370a13144ffSStefano Zampini } 1371213b8bfaSStefano Zampini ierr = ISLocalToGlobalMappingDestroy(&el2g);CHKERRQ(ierr); 1372a13144ffSStefano Zampini 1373a13144ffSStefano Zampini /* Start assembling */ 1374a13144ffSStefano Zampini ierr = MatAssemblyBegin(T,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 13751e0482f5SStefano Zampini if (pcbddc->nedcG) { 13761e0482f5SStefano Zampini ierr = MatAssemblyBegin(pcbddc->nedcG,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 13771e0482f5SStefano Zampini } 1378a13144ffSStefano Zampini 1379a13144ffSStefano Zampini /* Free */ 1380c2151214SStefano Zampini if (fl2g) { 1381c2151214SStefano Zampini ierr = ISDestroy(&primals);CHKERRQ(ierr); 1382c2151214SStefano Zampini for (i=0;i<nee;i++) { 1383c2151214SStefano Zampini ierr = ISDestroy(&eedges[i]);CHKERRQ(ierr); 1384c2151214SStefano Zampini } 1385c2151214SStefano Zampini ierr = PetscFree(eedges);CHKERRQ(ierr); 1386c2151214SStefano Zampini } 1387eee23b56SStefano Zampini 1388eee23b56SStefano Zampini /* hack mat_graph with primal dofs on the coarse edges */ 1389eee23b56SStefano Zampini { 1390eee23b56SStefano Zampini PCBDDCGraph graph = pcbddc->mat_graph; 1391eee23b56SStefano Zampini PetscInt *oqueue = graph->queue; 1392eee23b56SStefano Zampini PetscInt *ocptr = graph->cptr; 1393eee23b56SStefano Zampini PetscInt ncc,*idxs; 1394eee23b56SStefano Zampini 1395eee23b56SStefano Zampini /* find first primal edge */ 1396eee23b56SStefano Zampini if (pcbddc->nedclocal) { 1397eee23b56SStefano Zampini ierr = ISGetIndices(pcbddc->nedclocal,(const PetscInt**)&idxs);CHKERRQ(ierr); 1398eee23b56SStefano Zampini } else { 1399eee23b56SStefano Zampini if (fl2g) { 
1400eee23b56SStefano Zampini ierr = ISLocalToGlobalMappingApply(fl2g,nee,cedges,cedges);CHKERRQ(ierr); 1401eee23b56SStefano Zampini } 1402eee23b56SStefano Zampini idxs = cedges; 1403eee23b56SStefano Zampini } 1404eee23b56SStefano Zampini cum = 0; 1405eee23b56SStefano Zampini while (cum < nee && cedges[cum] < 0) cum++; 1406eee23b56SStefano Zampini 1407eee23b56SStefano Zampini /* adapt connected components */ 1408eee23b56SStefano Zampini ierr = PetscMalloc2(graph->nvtxs+1,&graph->cptr,ocptr[graph->ncc],&graph->queue);CHKERRQ(ierr); 1409eee23b56SStefano Zampini graph->cptr[0] = 0; 1410eee23b56SStefano Zampini for (i=0,ncc=0;i<graph->ncc;i++) { 1411eee23b56SStefano Zampini PetscInt lc = ocptr[i+1]-ocptr[i]; 1412eee23b56SStefano Zampini if (cum != nee && oqueue[ocptr[i+1]-1] == cedges[cum]) { /* this cc has a primal dof */ 1413eee23b56SStefano Zampini graph->cptr[ncc+1] = graph->cptr[ncc]+1; 1414eee23b56SStefano Zampini graph->queue[graph->cptr[ncc]] = cedges[cum]; 1415eee23b56SStefano Zampini ncc++; 1416eee23b56SStefano Zampini lc--; 1417eee23b56SStefano Zampini cum++; 1418eee23b56SStefano Zampini while (cum < nee && cedges[cum] < 0) cum++; 1419eee23b56SStefano Zampini } 1420eee23b56SStefano Zampini graph->cptr[ncc+1] = graph->cptr[ncc] + lc; 1421eee23b56SStefano Zampini for (j=0;j<lc;j++) graph->queue[graph->cptr[ncc]+j] = oqueue[ocptr[i]+j]; 1422eee23b56SStefano Zampini ncc++; 1423eee23b56SStefano Zampini } 1424eee23b56SStefano Zampini graph->ncc = ncc; 1425eee23b56SStefano Zampini if (pcbddc->nedclocal) { 1426eee23b56SStefano Zampini ierr = ISRestoreIndices(pcbddc->nedclocal,(const PetscInt**)&idxs);CHKERRQ(ierr); 1427eee23b56SStefano Zampini } 1428eee23b56SStefano Zampini ierr = PetscFree2(ocptr,oqueue);CHKERRQ(ierr); 1429eee23b56SStefano Zampini } 1430213b8bfaSStefano Zampini ierr = ISLocalToGlobalMappingDestroy(&fl2g);CHKERRQ(ierr); 1431c2151214SStefano Zampini ierr = 
PCBDDCGraphRestoreCandidatesIS(pcbddc->mat_graph,NULL,NULL,&nee,&alleedges,&allprimals);CHKERRQ(ierr); 1432c2151214SStefano Zampini ierr = PCBDDCGraphResetCSR(pcbddc->mat_graph);CHKERRQ(ierr); 1433213b8bfaSStefano Zampini ierr = MatDestroy(&conn);CHKERRQ(ierr); 1434eee23b56SStefano Zampini 1435c2151214SStefano Zampini ierr = ISDestroy(&nedfieldlocal);CHKERRQ(ierr); 1436a13144ffSStefano Zampini ierr = PetscFree(extrow);CHKERRQ(ierr); 1437a13144ffSStefano Zampini ierr = PetscFree2(work,rwork);CHKERRQ(ierr); 1438b03ebc13SStefano Zampini ierr = PetscFree(corners);CHKERRQ(ierr); 1439b03ebc13SStefano Zampini ierr = PetscFree(cedges);CHKERRQ(ierr); 1440a13144ffSStefano Zampini ierr = PetscFree(extrows);CHKERRQ(ierr); 1441a13144ffSStefano Zampini ierr = PetscFree(extcols);CHKERRQ(ierr); 1442a13144ffSStefano Zampini ierr = MatDestroy(&lG);CHKERRQ(ierr); 1443a13144ffSStefano Zampini 1444a13144ffSStefano Zampini /* Complete assembling */ 1445a13144ffSStefano Zampini ierr = MatAssemblyEnd(T,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 14461e0482f5SStefano Zampini if (pcbddc->nedcG) { 14471e0482f5SStefano Zampini ierr = MatAssemblyEnd(pcbddc->nedcG,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 14481e0482f5SStefano Zampini #if 0 14491e0482f5SStefano Zampini ierr = PetscObjectSetName((PetscObject)pcbddc->nedcG,"coarse_G");CHKERRQ(ierr); 14501e0482f5SStefano Zampini ierr = MatView(pcbddc->nedcG,NULL);CHKERRQ(ierr); 14511e0482f5SStefano Zampini #endif 14521e0482f5SStefano Zampini } 1453a13144ffSStefano Zampini 1454a13144ffSStefano Zampini /* set change of basis */ 1455213b8bfaSStefano Zampini ierr = PCBDDCSetChangeOfBasisMat(pc,T,singular);CHKERRQ(ierr); 1456a13144ffSStefano Zampini ierr = MatDestroy(&T);CHKERRQ(ierr); 1457a13144ffSStefano Zampini 1458a13144ffSStefano Zampini PetscFunctionReturn(0); 1459a13144ffSStefano Zampini } 1460a13144ffSStefano Zampini 1461d8203eabSStefano Zampini /* the near-null space of BDDC carries information on quadrature weights, 1462d8203eabSStefano Zampini and these can 
be collinear -> so cheat with MatNullSpaceCreate 1463d8203eabSStefano Zampini and create a suitable set of basis vectors first */ /* PCBDDCNullSpaceCreate: wraps MatNullSpaceCreate(comm,has_const,nvecs,quad_vecs,nnsp). Before that call, each quad_vecs[i] receives temporary nonzero entries, written by the process whose ownership range contains index i; after the call the very same entries are set to 0. Raises PETSC_ERR_SUP ("Not implemented") when has_const is true and the local size of a vector is smaller than 2*nvecs. The result is returned through nnsp. */ 1464d8203eabSStefano Zampini PetscErrorCode PCBDDCNullSpaceCreate(MPI_Comm comm, PetscBool has_const, PetscInt nvecs, Vec quad_vecs[], MatNullSpace *nnsp) 1465d8203eabSStefano Zampini { 1466d8203eabSStefano Zampini PetscErrorCode ierr; 1467d8203eabSStefano Zampini PetscInt i; 1468d8203eabSStefano Zampini 1469d8203eabSStefano Zampini PetscFunctionBegin; 1470d8203eabSStefano Zampini for (i=0;i<nvecs;i++) { 1471d8203eabSStefano Zampini PetscInt first,last; 1472d8203eabSStefano Zampini 1473d8203eabSStefano Zampini ierr = VecGetOwnershipRange(quad_vecs[i],&first,&last);CHKERRQ(ierr); 147486fa73c5SStefano Zampini /* the has_const branch below writes local offsets up to 2*i-first+1 with i < nvecs; this size check presumably exists to keep those writes in bounds */ if (last-first < 2*nvecs && has_const) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"Not implemented"); 1475d8203eabSStefano Zampini /* only the process owning global index i writes into vector i */ if (i>=first && i < last) { 1476d8203eabSStefano Zampini PetscScalar *data; 1477d8203eabSStefano Zampini ierr = VecGetArray(quad_vecs[i],&data);CHKERRQ(ierr); 1478d8203eabSStefano Zampini /* no constant: a single 1 at local offset i-first; with constant: the pair (1,-1)/sqrt(2) at local offsets 2*i-first and 2*i-first+1 */ if (!has_const) { 1479d8203eabSStefano Zampini data[i-first] = 1.; 1480d8203eabSStefano Zampini } else { 148186fa73c5SStefano Zampini data[2*i-first] = 1./PetscSqrtReal(2.); 148286fa73c5SStefano Zampini data[2*i-first+1] = -1./PetscSqrtReal(2.); 1483d8203eabSStefano Zampini } 1484d8203eabSStefano Zampini ierr = VecRestoreArray(quad_vecs[i],&data);CHKERRQ(ierr); 1485d8203eabSStefano Zampini } 1486d8203eabSStefano Zampini /* the object state is bumped on every process, including those that wrote nothing */ ierr = PetscObjectStateIncrease((PetscObject)quad_vecs[i]);CHKERRQ(ierr); 1487d8203eabSStefano Zampini } 1488d8203eabSStefano Zampini ierr = MatNullSpaceCreate(comm,has_const,nvecs,quad_vecs,nnsp);CHKERRQ(ierr); 1489d8203eabSStefano Zampini for (i=0;i<nvecs;i++) { /* reset vectors */ 1490d8203eabSStefano Zampini PetscInt first,last; 1491ddc40e2cSstefano_zampini /* NOTE(review): presumably MatNullSpaceCreate leaves the vectors read-locked, hence the lock pop here before writing and the matching push at the end of the loop body; confirm against the PETSc version in use */ ierr = VecLockPop(quad_vecs[i]);CHKERRQ(ierr); 1492d8203eabSStefano Zampini ierr = VecGetOwnershipRange(quad_vecs[i],&first,&last);CHKERRQ(ierr); 
1493d8203eabSStefano Zampini if (i>=first && i < last) { 1494d8203eabSStefano Zampini PetscScalar *data; 1495d8203eabSStefano Zampini ierr = VecGetArray(quad_vecs[i],&data);CHKERRQ(ierr); 1496d8203eabSStefano Zampini /* zero exactly the entries that were set before MatNullSpaceCreate (they are set to 0, not restored to any earlier value) */ if (!has_const) { 1497d8203eabSStefano Zampini data[i-first] = 0.; 1498d8203eabSStefano Zampini } else { 149986fa73c5SStefano Zampini data[2*i-first] = 0.; 150086fa73c5SStefano Zampini data[2*i-first+1] = 0.; 1501d8203eabSStefano Zampini } 1502d8203eabSStefano Zampini ierr = VecRestoreArray(quad_vecs[i],&data);CHKERRQ(ierr); 1503d8203eabSStefano Zampini } 1504d8203eabSStefano Zampini ierr = PetscObjectStateIncrease((PetscObject)quad_vecs[i]);CHKERRQ(ierr); 1505ddc40e2cSstefano_zampini ierr = VecLockPush(quad_vecs[i]);CHKERRQ(ierr); 1506d8203eabSStefano Zampini } 1507d8203eabSStefano Zampini PetscFunctionReturn(0); 1508d8203eabSStefano Zampini } 1509d8203eabSStefano Zampini 15108ae0ca82SStefano Zampini PetscErrorCode PCBDDCComputeNoNetFlux(Mat A, Mat divudotp, PetscBool transpose, IS vl2l, PCBDDCGraph graph, MatNullSpace *nnsp) 1511669cc0f4SStefano Zampini { 1512a198735bSStefano Zampini Mat loc_divudotp; 1513fa23a32eSStefano Zampini Vec p,v,vins,quad_vec,*quad_vecs; 15148ae0ca82SStefano Zampini ISLocalToGlobalMapping map; 1515669cc0f4SStefano Zampini IS *faces,*edges; 1516669cc0f4SStefano Zampini PetscScalar *vals; 1517669cc0f4SStefano Zampini const PetscScalar *array; 1518669cc0f4SStefano Zampini PetscInt i,maxneighs,lmaxneighs,maxsize,nf,ne; 15191ae86dd6SStefano Zampini PetscMPIInt rank; 1520a198735bSStefano Zampini PetscErrorCode ierr; 1521669cc0f4SStefano Zampini 1522669cc0f4SStefano Zampini PetscFunctionBegin; 1523669cc0f4SStefano Zampini ierr = PCBDDCGraphGetCandidatesIS(graph,&nf,&faces,&ne,&edges,NULL);CHKERRQ(ierr); 1524669cc0f4SStefano Zampini if (graph->twodim) { 1525669cc0f4SStefano Zampini lmaxneighs = 2; 1526669cc0f4SStefano Zampini } else { 1527669cc0f4SStefano Zampini lmaxneighs = 1; 1528669cc0f4SStefano Zampini for (i=0;i<ne;i++) { 
1529669cc0f4SStefano Zampini const PetscInt *idxs; 1530669cc0f4SStefano Zampini ierr = ISGetIndices(edges[i],&idxs);CHKERRQ(ierr); 1531669cc0f4SStefano Zampini lmaxneighs = PetscMax(lmaxneighs,graph->count[idxs[0]]); 1532669cc0f4SStefano Zampini ierr = ISRestoreIndices(edges[i],&idxs);CHKERRQ(ierr); 1533669cc0f4SStefano Zampini } 1534669cc0f4SStefano Zampini lmaxneighs++; /* graph count does not include self */ 1535669cc0f4SStefano Zampini } 1536669cc0f4SStefano Zampini ierr = MPIU_Allreduce(&lmaxneighs,&maxneighs,1,MPIU_INT,MPI_MAX,PetscObjectComm((PetscObject)A));CHKERRQ(ierr); 1537669cc0f4SStefano Zampini maxsize = 0; 1538669cc0f4SStefano Zampini for (i=0;i<ne;i++) { 1539669cc0f4SStefano Zampini PetscInt nn; 1540669cc0f4SStefano Zampini ierr = ISGetLocalSize(edges[i],&nn);CHKERRQ(ierr); 1541669cc0f4SStefano Zampini maxsize = PetscMax(maxsize,nn); 1542669cc0f4SStefano Zampini } 1543669cc0f4SStefano Zampini for (i=0;i<nf;i++) { 1544669cc0f4SStefano Zampini PetscInt nn; 1545669cc0f4SStefano Zampini ierr = ISGetLocalSize(faces[i],&nn);CHKERRQ(ierr); 1546669cc0f4SStefano Zampini maxsize = PetscMax(maxsize,nn); 1547669cc0f4SStefano Zampini } 1548669cc0f4SStefano Zampini ierr = PetscMalloc1(maxsize,&vals);CHKERRQ(ierr); 1549669cc0f4SStefano Zampini /* create vectors to hold quadrature weights */ 1550669cc0f4SStefano Zampini ierr = MatCreateVecs(A,&quad_vec,NULL);CHKERRQ(ierr); 15518ae0ca82SStefano Zampini if (!transpose) { 15528ae0ca82SStefano Zampini ierr = MatGetLocalToGlobalMapping(A,&map,NULL);CHKERRQ(ierr); 15538ae0ca82SStefano Zampini } else { 15548ae0ca82SStefano Zampini ierr = MatGetLocalToGlobalMapping(A,NULL,&map);CHKERRQ(ierr); 15558ae0ca82SStefano Zampini } 1556669cc0f4SStefano Zampini ierr = VecDuplicateVecs(quad_vec,maxneighs,&quad_vecs);CHKERRQ(ierr); 15571ae86dd6SStefano Zampini ierr = VecDestroy(&quad_vec);CHKERRQ(ierr); 1558d8203eabSStefano Zampini ierr = 
PCBDDCNullSpaceCreate(PetscObjectComm((PetscObject)A),PETSC_FALSE,maxneighs,quad_vecs,nnsp);CHKERRQ(ierr); 1559669cc0f4SStefano Zampini for (i=0;i<maxneighs;i++) { 1560ddc40e2cSstefano_zampini ierr = VecLockPop(quad_vecs[i]);CHKERRQ(ierr); 15618ae0ca82SStefano Zampini ierr = VecSetLocalToGlobalMapping(quad_vecs[i],map);CHKERRQ(ierr); 1562669cc0f4SStefano Zampini } 1563d8203eabSStefano Zampini 1564669cc0f4SStefano Zampini /* compute local quad vec */ 1565a198735bSStefano Zampini ierr = MatISGetLocalMat(divudotp,&loc_divudotp);CHKERRQ(ierr); 15668ae0ca82SStefano Zampini if (!transpose) { 1567a198735bSStefano Zampini ierr = MatCreateVecs(loc_divudotp,&v,&p);CHKERRQ(ierr); 15688ae0ca82SStefano Zampini } else { 15698ae0ca82SStefano Zampini ierr = MatCreateVecs(loc_divudotp,&p,&v);CHKERRQ(ierr); 15708ae0ca82SStefano Zampini } 1571669cc0f4SStefano Zampini ierr = VecSet(p,1.);CHKERRQ(ierr); 15728ae0ca82SStefano Zampini if (!transpose) { 1573a198735bSStefano Zampini ierr = MatMultTranspose(loc_divudotp,p,v);CHKERRQ(ierr); 15748ae0ca82SStefano Zampini } else { 15758ae0ca82SStefano Zampini ierr = MatMult(loc_divudotp,p,v);CHKERRQ(ierr); 15768ae0ca82SStefano Zampini } 1577fa23a32eSStefano Zampini if (vl2l) { 1578187c917aSStefano Zampini Mat lA; 1579187c917aSStefano Zampini VecScatter sc; 1580187c917aSStefano Zampini 1581187c917aSStefano Zampini ierr = MatISGetLocalMat(A,&lA);CHKERRQ(ierr); 1582187c917aSStefano Zampini ierr = MatCreateVecs(lA,&vins,NULL);CHKERRQ(ierr); 1583187c917aSStefano Zampini ierr = VecScatterCreate(v,vl2l,vins,NULL,&sc);CHKERRQ(ierr); 1584187c917aSStefano Zampini ierr = VecScatterBegin(sc,v,vins,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 1585187c917aSStefano Zampini ierr = VecScatterEnd(sc,v,vins,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 1586187c917aSStefano Zampini ierr = VecScatterDestroy(&sc);CHKERRQ(ierr); 1587fa23a32eSStefano Zampini } else { 1588fa23a32eSStefano Zampini vins = v; 1589fa23a32eSStefano Zampini } 1590fa23a32eSStefano Zampini 
ierr = VecGetArrayRead(vins,&array);CHKERRQ(ierr); 1591669cc0f4SStefano Zampini ierr = VecDestroy(&p);CHKERRQ(ierr); 15929a962809SStefano Zampini 15931ae86dd6SStefano Zampini /* insert in global quadrature vecs */ 15941ae86dd6SStefano Zampini ierr = MPI_Comm_rank(PetscObjectComm((PetscObject)A),&rank);CHKERRQ(ierr); 1595669cc0f4SStefano Zampini for (i=0;i<nf;i++) { 1596669cc0f4SStefano Zampini const PetscInt *idxs; 1597669cc0f4SStefano Zampini PetscInt idx,nn,j; 1598669cc0f4SStefano Zampini 1599669cc0f4SStefano Zampini ierr = ISGetIndices(faces[i],&idxs);CHKERRQ(ierr); 1600669cc0f4SStefano Zampini ierr = ISGetLocalSize(faces[i],&nn);CHKERRQ(ierr); 1601669cc0f4SStefano Zampini for (j=0;j<nn;j++) vals[j] = array[idxs[j]]; 16021ae86dd6SStefano Zampini ierr = PetscFindInt(rank,graph->count[idxs[0]],graph->neighbours_set[idxs[0]],&idx);CHKERRQ(ierr); 1603669cc0f4SStefano Zampini idx = -(idx+1); 1604669cc0f4SStefano Zampini ierr = VecSetValuesLocal(quad_vecs[idx],nn,idxs,vals,INSERT_VALUES);CHKERRQ(ierr); 1605669cc0f4SStefano Zampini ierr = ISRestoreIndices(faces[i],&idxs);CHKERRQ(ierr); 1606669cc0f4SStefano Zampini } 1607669cc0f4SStefano Zampini for (i=0;i<ne;i++) { 1608669cc0f4SStefano Zampini const PetscInt *idxs; 1609669cc0f4SStefano Zampini PetscInt idx,nn,j; 1610669cc0f4SStefano Zampini 1611669cc0f4SStefano Zampini ierr = ISGetIndices(edges[i],&idxs);CHKERRQ(ierr); 1612669cc0f4SStefano Zampini ierr = ISGetLocalSize(edges[i],&nn);CHKERRQ(ierr); 1613669cc0f4SStefano Zampini for (j=0;j<nn;j++) vals[j] = array[idxs[j]]; 16141ae86dd6SStefano Zampini ierr = PetscFindInt(rank,graph->count[idxs[0]],graph->neighbours_set[idxs[0]],&idx);CHKERRQ(ierr); 1615669cc0f4SStefano Zampini idx = -(idx+1); 1616669cc0f4SStefano Zampini ierr = VecSetValuesLocal(quad_vecs[idx],nn,idxs,vals,INSERT_VALUES);CHKERRQ(ierr); 1617669cc0f4SStefano Zampini ierr = ISRestoreIndices(edges[i],&idxs);CHKERRQ(ierr); 1618669cc0f4SStefano Zampini } 1619c8272957SStefano Zampini ierr = 
PCBDDCGraphRestoreCandidatesIS(graph,&nf,&faces,&ne,&edges,NULL);CHKERRQ(ierr); 1620fa23a32eSStefano Zampini ierr = VecRestoreArrayRead(vins,&array);CHKERRQ(ierr); 1621fa23a32eSStefano Zampini if (vl2l) { 1622187c917aSStefano Zampini ierr = VecDestroy(&vins);CHKERRQ(ierr); 1623fa23a32eSStefano Zampini } 1624669cc0f4SStefano Zampini ierr = VecDestroy(&v);CHKERRQ(ierr); 1625669cc0f4SStefano Zampini ierr = PetscFree(vals);CHKERRQ(ierr); 1626669cc0f4SStefano Zampini 1627669cc0f4SStefano Zampini /* assemble near null space */ 1628669cc0f4SStefano Zampini for (i=0;i<maxneighs;i++) { 1629669cc0f4SStefano Zampini ierr = VecAssemblyBegin(quad_vecs[i]);CHKERRQ(ierr); 1630669cc0f4SStefano Zampini } 1631669cc0f4SStefano Zampini for (i=0;i<maxneighs;i++) { 1632669cc0f4SStefano Zampini ierr = VecAssemblyEnd(quad_vecs[i]);CHKERRQ(ierr); 1633ddc40e2cSstefano_zampini ierr = VecLockPush(quad_vecs[i]);CHKERRQ(ierr); 1634669cc0f4SStefano Zampini } 1635669cc0f4SStefano Zampini ierr = VecDestroyVecs(maxneighs,&quad_vecs);CHKERRQ(ierr); 1636669cc0f4SStefano Zampini PetscFunctionReturn(0); 1637669cc0f4SStefano Zampini } 1638669cc0f4SStefano Zampini 1639669cc0f4SStefano Zampini 16401f4df5f7SStefano Zampini PetscErrorCode PCBDDCComputeLocalTopologyInfo(PC pc) 16411f4df5f7SStefano Zampini { 16421f4df5f7SStefano Zampini PetscErrorCode ierr; 16431f4df5f7SStefano Zampini Vec local,global; 16441f4df5f7SStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 16451f4df5f7SStefano Zampini Mat_IS *matis = (Mat_IS*)pc->pmat->data; 16465c5e10d6SStefano Zampini PetscBool monolithic = PETSC_FALSE; 16471f4df5f7SStefano Zampini 16481f4df5f7SStefano Zampini PetscFunctionBegin; 16495c5e10d6SStefano Zampini ierr = PetscOptionsBegin(PetscObjectComm((PetscObject)pc),((PetscObject)pc)->prefix,"BDDC topology options","PC");CHKERRQ(ierr); 16505c5e10d6SStefano Zampini ierr = PetscOptionsBool("-pc_bddc_monolithic","Discard any information on dofs splitting",NULL,monolithic,&monolithic,NULL);CHKERRQ(ierr); 
16515c5e10d6SStefano Zampini ierr = PetscOptionsEnd();CHKERRQ(ierr); 16521f4df5f7SStefano Zampini /* need to convert from global to local topology information and remove references to information in global ordering */ 165321ef3d20SStefano Zampini ierr = MatCreateVecs(pc->pmat,&global,NULL);CHKERRQ(ierr); 16541f4df5f7SStefano Zampini ierr = MatCreateVecs(matis->A,&local,NULL);CHKERRQ(ierr); 16555c5e10d6SStefano Zampini if (monolithic) goto boundary; 16565c5e10d6SStefano Zampini 16571f4df5f7SStefano Zampini if (pcbddc->user_provided_isfordofs) { 16581f4df5f7SStefano Zampini if (pcbddc->n_ISForDofs) { 16591f4df5f7SStefano Zampini PetscInt i; 16601f4df5f7SStefano Zampini ierr = PetscMalloc1(pcbddc->n_ISForDofs,&pcbddc->ISForDofsLocal);CHKERRQ(ierr); 16611f4df5f7SStefano Zampini for (i=0;i<pcbddc->n_ISForDofs;i++) { 16621f4df5f7SStefano Zampini ierr = PCBDDCGlobalToLocal(matis->rctx,global,local,pcbddc->ISForDofs[i],&pcbddc->ISForDofsLocal[i]);CHKERRQ(ierr); 16631f4df5f7SStefano Zampini ierr = ISDestroy(&pcbddc->ISForDofs[i]);CHKERRQ(ierr); 16641f4df5f7SStefano Zampini } 16651f4df5f7SStefano Zampini pcbddc->n_ISForDofsLocal = pcbddc->n_ISForDofs; 16661f4df5f7SStefano Zampini pcbddc->n_ISForDofs = 0; 16671f4df5f7SStefano Zampini ierr = PetscFree(pcbddc->ISForDofs);CHKERRQ(ierr); 16681f4df5f7SStefano Zampini } 16691f4df5f7SStefano Zampini } else { 167021ef3d20SStefano Zampini if (!pcbddc->n_ISForDofsLocal) { /* field split not present */ 167121ef3d20SStefano Zampini DM dm; 167221ef3d20SStefano Zampini 167321ef3d20SStefano Zampini ierr = PCGetDM(pc, &dm);CHKERRQ(ierr); 167421ef3d20SStefano Zampini if (!dm) { 167521ef3d20SStefano Zampini ierr = MatGetDM(pc->pmat, &dm);CHKERRQ(ierr); 167621ef3d20SStefano Zampini } 167721ef3d20SStefano Zampini if (dm) { 167821ef3d20SStefano Zampini IS *fields; 167921ef3d20SStefano Zampini PetscInt nf,i; 168021ef3d20SStefano Zampini ierr = DMCreateFieldDecomposition(dm,&nf,NULL,&fields,NULL);CHKERRQ(ierr); 168121ef3d20SStefano Zampini ierr = 
PetscMalloc1(nf,&pcbddc->ISForDofsLocal);CHKERRQ(ierr); 168221ef3d20SStefano Zampini for (i=0;i<nf;i++) { 168321ef3d20SStefano Zampini ierr = PCBDDCGlobalToLocal(matis->rctx,global,local,fields[i],&pcbddc->ISForDofsLocal[i]);CHKERRQ(ierr); 168421ef3d20SStefano Zampini ierr = ISDestroy(&fields[i]);CHKERRQ(ierr); 168521ef3d20SStefano Zampini } 168621ef3d20SStefano Zampini ierr = PetscFree(fields);CHKERRQ(ierr); 168721ef3d20SStefano Zampini pcbddc->n_ISForDofsLocal = nf; 168821ef3d20SStefano Zampini } else { /* See if MATIS has fields attached by the conversion from MatNest */ 168921ef3d20SStefano Zampini PetscContainer c; 169021ef3d20SStefano Zampini 169121ef3d20SStefano Zampini ierr = PetscObjectQuery((PetscObject)pc->pmat,"_convert_nest_lfields",(PetscObject*)&c);CHKERRQ(ierr); 169221ef3d20SStefano Zampini if (c) { 169321ef3d20SStefano Zampini MatISLocalFields lf; 169421ef3d20SStefano Zampini ierr = PetscContainerGetPointer(c,(void**)&lf);CHKERRQ(ierr); 169521ef3d20SStefano Zampini ierr = PCBDDCSetDofsSplittingLocal(pc,lf->nr,lf->rf);CHKERRQ(ierr); 169621ef3d20SStefano Zampini } else { /* fallback, create the default fields if bs > 1 */ 16971f4df5f7SStefano Zampini PetscInt i, n = matis->A->rmap->n; 1698986cdee1SStefano Zampini ierr = MatGetBlockSize(pc->pmat,&i);CHKERRQ(ierr); 169921ef3d20SStefano Zampini if (i > 1) { 1700986cdee1SStefano Zampini pcbddc->n_ISForDofsLocal = i; 17011f4df5f7SStefano Zampini ierr = PetscMalloc1(pcbddc->n_ISForDofsLocal,&pcbddc->ISForDofsLocal);CHKERRQ(ierr); 17021f4df5f7SStefano Zampini for (i=0;i<pcbddc->n_ISForDofsLocal;i++) { 17031f4df5f7SStefano Zampini ierr = ISCreateStride(PetscObjectComm((PetscObject)pc),n/pcbddc->n_ISForDofsLocal,i,pcbddc->n_ISForDofsLocal,&pcbddc->ISForDofsLocal[i]);CHKERRQ(ierr); 17041f4df5f7SStefano Zampini } 17051f4df5f7SStefano Zampini } 170621ef3d20SStefano Zampini } 170721ef3d20SStefano Zampini } 17087a0e7b2cSstefano_zampini } else { 17097a0e7b2cSstefano_zampini PetscInt i; 17107a0e7b2cSstefano_zampini 
for (i=0;i<pcbddc->n_ISForDofsLocal;i++) { 17117a0e7b2cSstefano_zampini ierr = PCBDDCConsistencyCheckIS(pc,MPI_LAND,&pcbddc->ISForDofsLocal[i]);CHKERRQ(ierr); 17127a0e7b2cSstefano_zampini } 17131f4df5f7SStefano Zampini } 1714986cdee1SStefano Zampini } 17151f4df5f7SStefano Zampini 17165c5e10d6SStefano Zampini boundary: 17171f4df5f7SStefano Zampini if (!pcbddc->DirichletBoundariesLocal && pcbddc->DirichletBoundaries) { 17181f4df5f7SStefano Zampini ierr = PCBDDCGlobalToLocal(matis->rctx,global,local,pcbddc->DirichletBoundaries,&pcbddc->DirichletBoundariesLocal);CHKERRQ(ierr); 17197a0e7b2cSstefano_zampini } else if (pcbddc->DirichletBoundariesLocal) { 17207a0e7b2cSstefano_zampini ierr = PCBDDCConsistencyCheckIS(pc,MPI_LAND,&pcbddc->DirichletBoundariesLocal);CHKERRQ(ierr); 17211f4df5f7SStefano Zampini } 17221f4df5f7SStefano Zampini if (!pcbddc->NeumannBoundariesLocal && pcbddc->NeumannBoundaries) { 17231f4df5f7SStefano Zampini ierr = PCBDDCGlobalToLocal(matis->rctx,global,local,pcbddc->NeumannBoundaries,&pcbddc->NeumannBoundariesLocal);CHKERRQ(ierr); 17247a0e7b2cSstefano_zampini } else if (pcbddc->NeumannBoundariesLocal) { 17257a0e7b2cSstefano_zampini ierr = PCBDDCConsistencyCheckIS(pc,MPI_LOR,&pcbddc->NeumannBoundariesLocal);CHKERRQ(ierr); 17261f4df5f7SStefano Zampini } 17271f4df5f7SStefano Zampini if (!pcbddc->user_primal_vertices_local && pcbddc->user_primal_vertices) { 17281f4df5f7SStefano Zampini ierr = PCBDDCGlobalToLocal(matis->rctx,global,local,pcbddc->user_primal_vertices,&pcbddc->user_primal_vertices_local);CHKERRQ(ierr); 17291f4df5f7SStefano Zampini } 17301f4df5f7SStefano Zampini ierr = VecDestroy(&global);CHKERRQ(ierr); 17311f4df5f7SStefano Zampini ierr = VecDestroy(&local);CHKERRQ(ierr); 17327a0e7b2cSstefano_zampini 17337a0e7b2cSstefano_zampini PetscFunctionReturn(0); 17347a0e7b2cSstefano_zampini } 17357a0e7b2cSstefano_zampini 17367a0e7b2cSstefano_zampini PetscErrorCode PCBDDCConsistencyCheckIS(PC pc, MPI_Op mop, IS *is) 17377a0e7b2cSstefano_zampini { 
17387a0e7b2cSstefano_zampini Mat_IS *matis = (Mat_IS*)(pc->pmat->data); 17397a0e7b2cSstefano_zampini PetscErrorCode ierr; 17407a0e7b2cSstefano_zampini IS nis; 17417a0e7b2cSstefano_zampini const PetscInt *idxs; 17427a0e7b2cSstefano_zampini PetscInt i,nd,n = matis->A->rmap->n,*nidxs,nnd; 17437a0e7b2cSstefano_zampini PetscBool *ld; 17447a0e7b2cSstefano_zampini 17457a0e7b2cSstefano_zampini PetscFunctionBegin; 17467a0e7b2cSstefano_zampini if (mop != MPI_LAND && mop != MPI_LOR) SETERRQ(PetscObjectComm((PetscObject)(pc)),PETSC_ERR_SUP,"Supported are MPI_LAND and MPI_LOR"); 17477a0e7b2cSstefano_zampini ierr = MatISSetUpSF(pc->pmat);CHKERRQ(ierr); 17487a0e7b2cSstefano_zampini if (mop == MPI_LAND) { 17497a0e7b2cSstefano_zampini /* init rootdata with true */ 17507a0e7b2cSstefano_zampini ld = (PetscBool*) matis->sf_rootdata; 17517a0e7b2cSstefano_zampini for (i=0;i<pc->pmat->rmap->n;i++) ld[i] = PETSC_TRUE; 17527a0e7b2cSstefano_zampini } else { 17537a0e7b2cSstefano_zampini ierr = PetscMemzero(matis->sf_rootdata,pc->pmat->rmap->n*sizeof(PetscBool));CHKERRQ(ierr); 17547a0e7b2cSstefano_zampini } 17557a0e7b2cSstefano_zampini ierr = PetscMemzero(matis->sf_leafdata,n*sizeof(PetscBool));CHKERRQ(ierr); 17567a0e7b2cSstefano_zampini ierr = ISGetLocalSize(*is,&nd);CHKERRQ(ierr); 17577a0e7b2cSstefano_zampini ierr = ISGetIndices(*is,&idxs);CHKERRQ(ierr); 17587a0e7b2cSstefano_zampini ld = (PetscBool*) matis->sf_leafdata; 17597a0e7b2cSstefano_zampini for (i=0;i<nd;i++) 17607a0e7b2cSstefano_zampini if (-1 < idxs[i] && idxs[i] < n) 17617a0e7b2cSstefano_zampini ld[idxs[i]] = PETSC_TRUE; 17627a0e7b2cSstefano_zampini ierr = ISRestoreIndices(*is,&idxs);CHKERRQ(ierr); 17637a0e7b2cSstefano_zampini ierr = PetscSFReduceBegin(matis->sf,MPIU_BOOL,matis->sf_leafdata,matis->sf_rootdata,mop);CHKERRQ(ierr); 17647a0e7b2cSstefano_zampini ierr = PetscSFReduceEnd(matis->sf,MPIU_BOOL,matis->sf_leafdata,matis->sf_rootdata,mop);CHKERRQ(ierr); 17657a0e7b2cSstefano_zampini ierr = 
PetscSFBcastBegin(matis->sf,MPIU_BOOL,matis->sf_rootdata,matis->sf_leafdata);CHKERRQ(ierr); 17667a0e7b2cSstefano_zampini ierr = PetscSFBcastEnd(matis->sf,MPIU_BOOL,matis->sf_rootdata,matis->sf_leafdata);CHKERRQ(ierr); 17677a0e7b2cSstefano_zampini if (mop == MPI_LAND) { 17687a0e7b2cSstefano_zampini ierr = PetscMalloc1(nd,&nidxs);CHKERRQ(ierr); 17697a0e7b2cSstefano_zampini } else { 17707a0e7b2cSstefano_zampini ierr = PetscMalloc1(n,&nidxs);CHKERRQ(ierr); 17717a0e7b2cSstefano_zampini } 17727a0e7b2cSstefano_zampini for (i=0,nnd=0;i<n;i++) 17737a0e7b2cSstefano_zampini if (ld[i]) 17747a0e7b2cSstefano_zampini nidxs[nnd++] = i; 17757a0e7b2cSstefano_zampini ierr = ISCreateGeneral(PetscObjectComm((PetscObject)(*is)),nnd,nidxs,PETSC_OWN_POINTER,&nis);CHKERRQ(ierr); 17767a0e7b2cSstefano_zampini ierr = ISDestroy(is);CHKERRQ(ierr); 17777a0e7b2cSstefano_zampini *is = nis; 17781f4df5f7SStefano Zampini PetscFunctionReturn(0); 17791f4df5f7SStefano Zampini } 17801f4df5f7SStefano Zampini 17813e589ea0SStefano Zampini PetscErrorCode PCBDDCBenignRemoveInterior(PC pc,Vec r,Vec z) 17823e589ea0SStefano Zampini { 17833e589ea0SStefano Zampini PC_IS *pcis = (PC_IS*)(pc->data); 17843e589ea0SStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)(pc->data); 17853e589ea0SStefano Zampini PetscErrorCode ierr; 17863e589ea0SStefano Zampini 17873e589ea0SStefano Zampini PetscFunctionBegin; 17883e589ea0SStefano Zampini if (!pcbddc->benign_have_null) { 17893e589ea0SStefano Zampini PetscFunctionReturn(0); 17903e589ea0SStefano Zampini } 17913e589ea0SStefano Zampini if (pcbddc->ChangeOfBasisMatrix) { 17923e589ea0SStefano Zampini Vec swap; 17933e589ea0SStefano Zampini 17943e589ea0SStefano Zampini ierr = MatMultTranspose(pcbddc->ChangeOfBasisMatrix,r,pcbddc->work_change);CHKERRQ(ierr); 17953e589ea0SStefano Zampini swap = pcbddc->work_change; 17963e589ea0SStefano Zampini pcbddc->work_change = r; 17973e589ea0SStefano Zampini r = swap; 17983e589ea0SStefano Zampini } 17993e589ea0SStefano Zampini ierr = 
VecScatterBegin(pcis->global_to_D,r,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 18003e589ea0SStefano Zampini ierr = VecScatterEnd(pcis->global_to_D,r,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 18013e589ea0SStefano Zampini ierr = KSPSolve(pcbddc->ksp_D,pcis->vec1_D,pcis->vec2_D);CHKERRQ(ierr); 18023e589ea0SStefano Zampini ierr = VecSet(z,0.);CHKERRQ(ierr); 18033e589ea0SStefano Zampini ierr = VecScatterBegin(pcis->global_to_D,pcis->vec2_D,z,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 18043e589ea0SStefano Zampini ierr = VecScatterEnd(pcis->global_to_D,pcis->vec2_D,z,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 18053e589ea0SStefano Zampini if (pcbddc->ChangeOfBasisMatrix) { 1806f913dca9SStefano Zampini pcbddc->work_change = r; 18073e589ea0SStefano Zampini ierr = VecCopy(z,pcbddc->work_change);CHKERRQ(ierr); 18083e589ea0SStefano Zampini ierr = MatMult(pcbddc->ChangeOfBasisMatrix,pcbddc->work_change,z);CHKERRQ(ierr); 18093e589ea0SStefano Zampini } 18103e589ea0SStefano Zampini PetscFunctionReturn(0); 18113e589ea0SStefano Zampini } 18123e589ea0SStefano Zampini 1813a3df083aSStefano Zampini PetscErrorCode PCBDDCBenignMatMult_Private_Private(Mat A, Vec x, Vec y, PetscBool transpose) 1814a3df083aSStefano Zampini { 1815a3df083aSStefano Zampini PCBDDCBenignMatMult_ctx ctx; 1816a3df083aSStefano Zampini PetscErrorCode ierr; 1817a3df083aSStefano Zampini PetscBool apply_right,apply_left,reset_x; 1818a3df083aSStefano Zampini 1819a3df083aSStefano Zampini PetscFunctionBegin; 1820a3df083aSStefano Zampini ierr = MatShellGetContext(A,&ctx);CHKERRQ(ierr); 1821a3df083aSStefano Zampini if (transpose) { 1822a3df083aSStefano Zampini apply_right = ctx->apply_left; 1823a3df083aSStefano Zampini apply_left = ctx->apply_right; 1824a3df083aSStefano Zampini } else { 1825a3df083aSStefano Zampini apply_right = ctx->apply_right; 1826a3df083aSStefano Zampini apply_left = ctx->apply_left; 1827a3df083aSStefano Zampini } 1828a3df083aSStefano Zampini reset_x = PETSC_FALSE; 
1829a3df083aSStefano Zampini if (apply_right) { 1830a3df083aSStefano Zampini const PetscScalar *ax; 1831a3df083aSStefano Zampini PetscInt nl,i; 1832a3df083aSStefano Zampini 1833a3df083aSStefano Zampini ierr = VecGetLocalSize(x,&nl);CHKERRQ(ierr); 1834a3df083aSStefano Zampini ierr = VecGetArrayRead(x,&ax);CHKERRQ(ierr); 1835a3df083aSStefano Zampini ierr = PetscMemcpy(ctx->work,ax,nl*sizeof(PetscScalar));CHKERRQ(ierr); 1836a3df083aSStefano Zampini ierr = VecRestoreArrayRead(x,&ax);CHKERRQ(ierr); 1837a3df083aSStefano Zampini for (i=0;i<ctx->benign_n;i++) { 1838a3df083aSStefano Zampini PetscScalar sum,val; 1839a3df083aSStefano Zampini const PetscInt *idxs; 1840a3df083aSStefano Zampini PetscInt nz,j; 1841a3df083aSStefano Zampini ierr = ISGetLocalSize(ctx->benign_zerodiag_subs[i],&nz);CHKERRQ(ierr); 1842a3df083aSStefano Zampini ierr = ISGetIndices(ctx->benign_zerodiag_subs[i],&idxs);CHKERRQ(ierr); 1843a3df083aSStefano Zampini sum = 0.; 1844a3df083aSStefano Zampini if (ctx->apply_p0) { 1845a3df083aSStefano Zampini val = ctx->work[idxs[nz-1]]; 1846a3df083aSStefano Zampini for (j=0;j<nz-1;j++) { 1847a3df083aSStefano Zampini sum += ctx->work[idxs[j]]; 1848a3df083aSStefano Zampini ctx->work[idxs[j]] += val; 1849a3df083aSStefano Zampini } 1850a3df083aSStefano Zampini } else { 1851a3df083aSStefano Zampini for (j=0;j<nz-1;j++) { 1852a3df083aSStefano Zampini sum += ctx->work[idxs[j]]; 1853a3df083aSStefano Zampini } 1854a3df083aSStefano Zampini } 1855a3df083aSStefano Zampini ctx->work[idxs[nz-1]] -= sum; 1856a3df083aSStefano Zampini ierr = ISRestoreIndices(ctx->benign_zerodiag_subs[i],&idxs);CHKERRQ(ierr); 1857a3df083aSStefano Zampini } 1858a3df083aSStefano Zampini ierr = VecPlaceArray(x,ctx->work);CHKERRQ(ierr); 1859a3df083aSStefano Zampini reset_x = PETSC_TRUE; 1860a3df083aSStefano Zampini } 1861a3df083aSStefano Zampini if (transpose) { 1862a3df083aSStefano Zampini ierr = MatMultTranspose(ctx->A,x,y);CHKERRQ(ierr); 1863a3df083aSStefano Zampini } else { 1864a3df083aSStefano 
Zampini ierr = MatMult(ctx->A,x,y);CHKERRQ(ierr); 1865a3df083aSStefano Zampini } 1866a3df083aSStefano Zampini if (reset_x) { 1867a3df083aSStefano Zampini ierr = VecResetArray(x);CHKERRQ(ierr); 1868a3df083aSStefano Zampini } 1869a3df083aSStefano Zampini if (apply_left) { 1870a3df083aSStefano Zampini PetscScalar *ay; 1871a3df083aSStefano Zampini PetscInt i; 1872a3df083aSStefano Zampini 1873a3df083aSStefano Zampini ierr = VecGetArray(y,&ay);CHKERRQ(ierr); 1874a3df083aSStefano Zampini for (i=0;i<ctx->benign_n;i++) { 1875a3df083aSStefano Zampini PetscScalar sum,val; 1876a3df083aSStefano Zampini const PetscInt *idxs; 1877a3df083aSStefano Zampini PetscInt nz,j; 1878a3df083aSStefano Zampini ierr = ISGetLocalSize(ctx->benign_zerodiag_subs[i],&nz);CHKERRQ(ierr); 1879a3df083aSStefano Zampini ierr = ISGetIndices(ctx->benign_zerodiag_subs[i],&idxs);CHKERRQ(ierr); 1880a3df083aSStefano Zampini val = -ay[idxs[nz-1]]; 1881a3df083aSStefano Zampini if (ctx->apply_p0) { 1882a3df083aSStefano Zampini sum = 0.; 1883a3df083aSStefano Zampini for (j=0;j<nz-1;j++) { 1884a3df083aSStefano Zampini sum += ay[idxs[j]]; 1885a3df083aSStefano Zampini ay[idxs[j]] += val; 1886a3df083aSStefano Zampini } 1887a3df083aSStefano Zampini ay[idxs[nz-1]] += sum; 1888a3df083aSStefano Zampini } else { 1889a3df083aSStefano Zampini for (j=0;j<nz-1;j++) { 1890a3df083aSStefano Zampini ay[idxs[j]] += val; 1891a3df083aSStefano Zampini } 1892a3df083aSStefano Zampini ay[idxs[nz-1]] = 0.; 1893a3df083aSStefano Zampini } 1894a3df083aSStefano Zampini ierr = ISRestoreIndices(ctx->benign_zerodiag_subs[i],&idxs);CHKERRQ(ierr); 1895a3df083aSStefano Zampini } 1896a3df083aSStefano Zampini ierr = VecRestoreArray(y,&ay);CHKERRQ(ierr); 1897a3df083aSStefano Zampini } 1898a3df083aSStefano Zampini PetscFunctionReturn(0); 1899a3df083aSStefano Zampini } 1900a3df083aSStefano Zampini 1901a3df083aSStefano Zampini PetscErrorCode PCBDDCBenignMatMultTranspose_Private(Mat A, Vec x, Vec y) 1902a3df083aSStefano Zampini { 1903a3df083aSStefano 
Zampini PetscErrorCode ierr; 1904a3df083aSStefano Zampini 1905a3df083aSStefano Zampini PetscFunctionBegin; 1906a3df083aSStefano Zampini ierr = PCBDDCBenignMatMult_Private_Private(A,x,y,PETSC_TRUE);CHKERRQ(ierr); 1907a3df083aSStefano Zampini PetscFunctionReturn(0); 1908a3df083aSStefano Zampini } 1909a3df083aSStefano Zampini 1910a3df083aSStefano Zampini PetscErrorCode PCBDDCBenignMatMult_Private(Mat A, Vec x, Vec y) 1911a3df083aSStefano Zampini { 1912a3df083aSStefano Zampini PetscErrorCode ierr; 1913a3df083aSStefano Zampini 1914a3df083aSStefano Zampini PetscFunctionBegin; 1915a3df083aSStefano Zampini ierr = PCBDDCBenignMatMult_Private_Private(A,x,y,PETSC_FALSE);CHKERRQ(ierr); 1916a3df083aSStefano Zampini PetscFunctionReturn(0); 1917a3df083aSStefano Zampini } 1918a3df083aSStefano Zampini 1919a3df083aSStefano Zampini PetscErrorCode PCBDDCBenignShellMat(PC pc, PetscBool restore) 1920a3df083aSStefano Zampini { 1921a3df083aSStefano Zampini PC_IS *pcis = (PC_IS*)pc->data; 1922a3df083aSStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 1923a3df083aSStefano Zampini PCBDDCBenignMatMult_ctx ctx; 1924a3df083aSStefano Zampini PetscErrorCode ierr; 1925a3df083aSStefano Zampini 1926a3df083aSStefano Zampini PetscFunctionBegin; 1927a3df083aSStefano Zampini if (!restore) { 19281dd7afcfSStefano Zampini Mat A_IB,A_BI; 1929a3df083aSStefano Zampini PetscScalar *work; 1930b334f244SStefano Zampini PCBDDCReuseSolvers reuse = pcbddc->sub_schurs ? 
pcbddc->sub_schurs->reuse_solver : NULL; 1931a3df083aSStefano Zampini 19329a962809SStefano Zampini if (pcbddc->benign_original_mat) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Benign original mat has not been restored"); 19339a962809SStefano Zampini if (!pcbddc->benign_change || !pcbddc->benign_n || pcbddc->benign_change_explicit) PetscFunctionReturn(0); 1934a3df083aSStefano Zampini ierr = PetscMalloc1(pcis->n,&work);CHKERRQ(ierr); 1935a3df083aSStefano Zampini ierr = MatCreate(PETSC_COMM_SELF,&A_IB);CHKERRQ(ierr); 1936a3df083aSStefano Zampini ierr = MatSetSizes(A_IB,pcis->n-pcis->n_B,pcis->n_B,PETSC_DECIDE,PETSC_DECIDE);CHKERRQ(ierr); 1937a3df083aSStefano Zampini ierr = MatSetType(A_IB,MATSHELL);CHKERRQ(ierr); 1938a3df083aSStefano Zampini ierr = MatShellSetOperation(A_IB,MATOP_MULT,(void (*)(void))PCBDDCBenignMatMult_Private);CHKERRQ(ierr); 1939a3df083aSStefano Zampini ierr = MatShellSetOperation(A_IB,MATOP_MULT_TRANSPOSE,(void (*)(void))PCBDDCBenignMatMultTranspose_Private);CHKERRQ(ierr); 1940a3df083aSStefano Zampini ierr = PetscNew(&ctx);CHKERRQ(ierr); 1941a3df083aSStefano Zampini ierr = MatShellSetContext(A_IB,ctx);CHKERRQ(ierr); 1942a3df083aSStefano Zampini ctx->apply_left = PETSC_TRUE; 1943a3df083aSStefano Zampini ctx->apply_right = PETSC_FALSE; 1944a3df083aSStefano Zampini ctx->apply_p0 = PETSC_FALSE; 1945a3df083aSStefano Zampini ctx->benign_n = pcbddc->benign_n; 1946059032f7SStefano Zampini if (reuse) { 1947a3df083aSStefano Zampini ctx->benign_zerodiag_subs = reuse->benign_zerodiag_subs; 19481dd7afcfSStefano Zampini ctx->free = PETSC_FALSE; 1949059032f7SStefano Zampini } else { /* TODO: could be optimized for successive solves */ 1950059032f7SStefano Zampini ISLocalToGlobalMapping N_to_D; 1951059032f7SStefano Zampini PetscInt i; 1952059032f7SStefano Zampini 1953059032f7SStefano Zampini ierr = ISLocalToGlobalMappingCreateIS(pcis->is_I_local,&N_to_D);CHKERRQ(ierr); 1954059032f7SStefano Zampini ierr = 
PetscMalloc1(pcbddc->benign_n,&ctx->benign_zerodiag_subs);CHKERRQ(ierr); 1955059032f7SStefano Zampini for (i=0;i<pcbddc->benign_n;i++) { 1956059032f7SStefano Zampini ierr = ISGlobalToLocalMappingApplyIS(N_to_D,IS_GTOLM_DROP,pcbddc->benign_zerodiag_subs[i],&ctx->benign_zerodiag_subs[i]);CHKERRQ(ierr); 1957059032f7SStefano Zampini } 1958059032f7SStefano Zampini ierr = ISLocalToGlobalMappingDestroy(&N_to_D);CHKERRQ(ierr); 19591dd7afcfSStefano Zampini ctx->free = PETSC_TRUE; 1960059032f7SStefano Zampini } 1961a3df083aSStefano Zampini ctx->A = pcis->A_IB; 1962a3df083aSStefano Zampini ctx->work = work; 1963a3df083aSStefano Zampini ierr = MatSetUp(A_IB);CHKERRQ(ierr); 1964a3df083aSStefano Zampini ierr = MatAssemblyBegin(A_IB,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 1965a3df083aSStefano Zampini ierr = MatAssemblyEnd(A_IB,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 1966a3df083aSStefano Zampini pcis->A_IB = A_IB; 1967a3df083aSStefano Zampini 1968a3df083aSStefano Zampini /* A_BI as A_IB^T */ 1969a3df083aSStefano Zampini ierr = MatCreateTranspose(A_IB,&A_BI);CHKERRQ(ierr); 1970a3df083aSStefano Zampini pcbddc->benign_original_mat = pcis->A_BI; 1971a3df083aSStefano Zampini pcis->A_BI = A_BI; 1972a3df083aSStefano Zampini } else { 19731dd7afcfSStefano Zampini if (!pcbddc->benign_original_mat) { 19741dd7afcfSStefano Zampini PetscFunctionReturn(0); 19751dd7afcfSStefano Zampini } 1976a3df083aSStefano Zampini ierr = MatShellGetContext(pcis->A_IB,&ctx);CHKERRQ(ierr); 1977a3df083aSStefano Zampini ierr = MatDestroy(&pcis->A_IB);CHKERRQ(ierr); 1978a3df083aSStefano Zampini pcis->A_IB = ctx->A; 19791dd7afcfSStefano Zampini ctx->A = NULL; 19801dd7afcfSStefano Zampini ierr = MatDestroy(&pcis->A_BI);CHKERRQ(ierr); 19811dd7afcfSStefano Zampini pcis->A_BI = pcbddc->benign_original_mat; 19821dd7afcfSStefano Zampini pcbddc->benign_original_mat = NULL; 19831dd7afcfSStefano Zampini if (ctx->free) { 1984059032f7SStefano Zampini PetscInt i; 19851dd7afcfSStefano Zampini for (i=0;i<ctx->benign_n;i++) { 
1986059032f7SStefano Zampini ierr = ISDestroy(&ctx->benign_zerodiag_subs[i]);CHKERRQ(ierr); 1987059032f7SStefano Zampini } 1988059032f7SStefano Zampini ierr = PetscFree(ctx->benign_zerodiag_subs);CHKERRQ(ierr); 1989059032f7SStefano Zampini } 1990a3df083aSStefano Zampini ierr = PetscFree(ctx->work);CHKERRQ(ierr); 1991a3df083aSStefano Zampini ierr = PetscFree(ctx);CHKERRQ(ierr); 1992a3df083aSStefano Zampini } 1993a3df083aSStefano Zampini PetscFunctionReturn(0); 1994a3df083aSStefano Zampini } 1995a3df083aSStefano Zampini 1996a3df083aSStefano Zampini /* used just in bddc debug mode */ 1997a3df083aSStefano Zampini PetscErrorCode PCBDDCBenignProject(PC pc, IS is1, IS is2, Mat *B) 1998a3df083aSStefano Zampini { 1999a3df083aSStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 2000a3df083aSStefano Zampini Mat_IS *matis = (Mat_IS*)pc->pmat->data; 2001a3df083aSStefano Zampini Mat An; 2002a3df083aSStefano Zampini PetscErrorCode ierr; 2003a3df083aSStefano Zampini 2004a3df083aSStefano Zampini PetscFunctionBegin; 2005a3df083aSStefano Zampini ierr = MatPtAP(matis->A,pcbddc->benign_change,MAT_INITIAL_MATRIX,2.0,&An);CHKERRQ(ierr); 2006a3df083aSStefano Zampini ierr = MatZeroRowsColumns(An,pcbddc->benign_n,pcbddc->benign_p0_lidx,1.0,NULL,NULL);CHKERRQ(ierr); 2007a3df083aSStefano Zampini if (is1) { 20087dae84e0SHong Zhang ierr = MatCreateSubMatrix(An,is1,is2,MAT_INITIAL_MATRIX,B);CHKERRQ(ierr); 2009a3df083aSStefano Zampini ierr = MatDestroy(&An);CHKERRQ(ierr); 2010a3df083aSStefano Zampini } else { 2011a3df083aSStefano Zampini *B = An; 2012a3df083aSStefano Zampini } 2013a3df083aSStefano Zampini PetscFunctionReturn(0); 2014a3df083aSStefano Zampini } 2015a3df083aSStefano Zampini 20161cf9b237SStefano Zampini /* TODO: add reuse flag */ 20171cf9b237SStefano Zampini PetscErrorCode MatSeqAIJCompress(Mat A, Mat *B) 20181cf9b237SStefano Zampini { 20191cf9b237SStefano Zampini Mat Bt; 20201cf9b237SStefano Zampini PetscScalar *a,*bdata; 20211cf9b237SStefano Zampini const PetscInt *ii,*ij; 
20221cf9b237SStefano Zampini PetscInt m,n,i,nnz,*bii,*bij; 20231cf9b237SStefano Zampini PetscBool flg_row; 20241cf9b237SStefano Zampini PetscErrorCode ierr; 20251cf9b237SStefano Zampini 20261cf9b237SStefano Zampini PetscFunctionBegin; 20271cf9b237SStefano Zampini ierr = MatGetSize(A,&n,&m);CHKERRQ(ierr); 20281cf9b237SStefano Zampini ierr = MatGetRowIJ(A,0,PETSC_FALSE,PETSC_FALSE,&n,&ii,&ij,&flg_row);CHKERRQ(ierr); 20291cf9b237SStefano Zampini ierr = MatSeqAIJGetArray(A,&a);CHKERRQ(ierr); 20301cf9b237SStefano Zampini nnz = n; 20311cf9b237SStefano Zampini for (i=0;i<ii[n];i++) { 20321cf9b237SStefano Zampini if (PetscLikely(PetscAbsScalar(a[i]) > PETSC_SMALL)) nnz++; 20331cf9b237SStefano Zampini } 20341cf9b237SStefano Zampini ierr = PetscMalloc1(n+1,&bii);CHKERRQ(ierr); 20351cf9b237SStefano Zampini ierr = PetscMalloc1(nnz,&bij);CHKERRQ(ierr); 20361cf9b237SStefano Zampini ierr = PetscMalloc1(nnz,&bdata);CHKERRQ(ierr); 20371cf9b237SStefano Zampini nnz = 0; 20381cf9b237SStefano Zampini bii[0] = 0; 20391cf9b237SStefano Zampini for (i=0;i<n;i++) { 20401cf9b237SStefano Zampini PetscInt j; 20411cf9b237SStefano Zampini for (j=ii[i];j<ii[i+1];j++) { 20421cf9b237SStefano Zampini PetscScalar entry = a[j]; 20431cf9b237SStefano Zampini if (PetscLikely(PetscAbsScalar(entry) > PETSC_SMALL) || ij[j] == i) { 20441cf9b237SStefano Zampini bij[nnz] = ij[j]; 20451cf9b237SStefano Zampini bdata[nnz] = entry; 20461cf9b237SStefano Zampini nnz++; 20471cf9b237SStefano Zampini } 20481cf9b237SStefano Zampini } 20491cf9b237SStefano Zampini bii[i+1] = nnz; 20501cf9b237SStefano Zampini } 20511cf9b237SStefano Zampini ierr = MatSeqAIJRestoreArray(A,&a);CHKERRQ(ierr); 20521cf9b237SStefano Zampini ierr = MatCreateSeqAIJWithArrays(PetscObjectComm((PetscObject)A),n,m,bii,bij,bdata,&Bt);CHKERRQ(ierr); 20531cf9b237SStefano Zampini ierr = MatRestoreRowIJ(A,0,PETSC_FALSE,PETSC_FALSE,&n,&ii,&ij,&flg_row);CHKERRQ(ierr); 20541cf9b237SStefano Zampini { 20551cf9b237SStefano Zampini Mat_SeqAIJ *b = 
(Mat_SeqAIJ*)(Bt->data); 20561cf9b237SStefano Zampini b->free_a = PETSC_TRUE; 20571cf9b237SStefano Zampini b->free_ij = PETSC_TRUE; 20581cf9b237SStefano Zampini } 20591cf9b237SStefano Zampini *B = Bt; 20601cf9b237SStefano Zampini PetscFunctionReturn(0); 20611cf9b237SStefano Zampini } 20621cf9b237SStefano Zampini 2063c80a6c00SStefano Zampini PetscErrorCode PCBDDCDetectDisconnectedComponents(PC pc, PetscInt *ncc, IS* cc[], IS* primalv) 20644f1b2e48SStefano Zampini { 2065c80a6c00SStefano Zampini Mat B = NULL; 2066c80a6c00SStefano Zampini DM dm; 20674f1b2e48SStefano Zampini IS is_dummy,*cc_n; 20684f1b2e48SStefano Zampini ISLocalToGlobalMapping l2gmap_dummy; 20694f1b2e48SStefano Zampini PCBDDCGraph graph; 2070c80a6c00SStefano Zampini PetscInt *xadj_filtered = NULL,*adjncy_filtered = NULL; 20714f1b2e48SStefano Zampini PetscInt i,n; 20724f1b2e48SStefano Zampini PetscInt *xadj,*adjncy; 2073c80a6c00SStefano Zampini PetscBool isplex = PETSC_FALSE; 20744f1b2e48SStefano Zampini PetscErrorCode ierr; 20754f1b2e48SStefano Zampini 20764f1b2e48SStefano Zampini PetscFunctionBegin; 2077a2eca866SStefano Zampini if (ncc) *ncc = 0; 2078a2eca866SStefano Zampini if (cc) *cc = NULL; 2079a2eca866SStefano Zampini if (primalv) *primalv = NULL; 2080c80a6c00SStefano Zampini ierr = PCBDDCGraphCreate(&graph);CHKERRQ(ierr); 2081c80a6c00SStefano Zampini ierr = PCGetDM(pc,&dm);CHKERRQ(ierr); 2082c80a6c00SStefano Zampini if (!dm) { 2083c80a6c00SStefano Zampini ierr = MatGetDM(pc->pmat,&dm);CHKERRQ(ierr); 2084c80a6c00SStefano Zampini } 2085c80a6c00SStefano Zampini if (dm) { 2086c80a6c00SStefano Zampini ierr = PetscObjectTypeCompare((PetscObject)dm,DMPLEX,&isplex);CHKERRQ(ierr); 2087c80a6c00SStefano Zampini } 2088c80a6c00SStefano Zampini if (isplex) { /* this code has been modified from plexpartition.c */ 2089c80a6c00SStefano Zampini PetscInt p, pStart, pEnd, a, adjSize, idx, size, nroots; 2090c80a6c00SStefano Zampini PetscInt *adj = NULL; 2091c80a6c00SStefano Zampini IS cellNumbering; 
2092c80a6c00SStefano Zampini const PetscInt *cellNum; 2093c80a6c00SStefano Zampini PetscBool useCone, useClosure; 2094c80a6c00SStefano Zampini PetscSection section; 2095c80a6c00SStefano Zampini PetscSegBuffer adjBuffer; 2096c80a6c00SStefano Zampini PetscSF sfPoint; 2097c80a6c00SStefano Zampini PetscErrorCode ierr; 2098c80a6c00SStefano Zampini 2099c80a6c00SStefano Zampini PetscFunctionBegin; 2100c80a6c00SStefano Zampini ierr = DMPlexGetHeightStratum(dm, 0, &pStart, &pEnd);CHKERRQ(ierr); 2101c80a6c00SStefano Zampini ierr = DMGetPointSF(dm, &sfPoint);CHKERRQ(ierr); 2102c80a6c00SStefano Zampini ierr = PetscSFGetGraph(sfPoint, &nroots, NULL, NULL, NULL);CHKERRQ(ierr); 2103c80a6c00SStefano Zampini /* Build adjacency graph via a section/segbuffer */ 2104c80a6c00SStefano Zampini ierr = PetscSectionCreate(PetscObjectComm((PetscObject) dm), §ion);CHKERRQ(ierr); 2105c80a6c00SStefano Zampini ierr = PetscSectionSetChart(section, pStart, pEnd);CHKERRQ(ierr); 2106c80a6c00SStefano Zampini ierr = PetscSegBufferCreate(sizeof(PetscInt),1000,&adjBuffer);CHKERRQ(ierr); 2107c80a6c00SStefano Zampini /* Always use FVM adjacency to create partitioner graph */ 2108c80a6c00SStefano Zampini ierr = DMPlexGetAdjacencyUseCone(dm, &useCone);CHKERRQ(ierr); 2109c80a6c00SStefano Zampini ierr = DMPlexGetAdjacencyUseClosure(dm, &useClosure);CHKERRQ(ierr); 2110c80a6c00SStefano Zampini ierr = DMPlexSetAdjacencyUseCone(dm, PETSC_TRUE);CHKERRQ(ierr); 2111c80a6c00SStefano Zampini ierr = DMPlexSetAdjacencyUseClosure(dm, PETSC_FALSE);CHKERRQ(ierr); 2112956e2312SStefano Zampini ierr = DMPlexGetCellNumbering(dm, &cellNumbering);CHKERRQ(ierr); 2113c80a6c00SStefano Zampini ierr = ISGetIndices(cellNumbering, &cellNum);CHKERRQ(ierr); 2114c80a6c00SStefano Zampini for (n = 0, p = pStart; p < pEnd; p++) { 2115c80a6c00SStefano Zampini /* Skip non-owned cells in parallel (ParMetis expects no overlap) */ 2116c80a6c00SStefano Zampini if (nroots > 0) {if (cellNum[p] < 0) continue;} 2117c80a6c00SStefano Zampini adjSize = 
PETSC_DETERMINE; 2118c80a6c00SStefano Zampini ierr = DMPlexGetAdjacency(dm, p, &adjSize, &adj);CHKERRQ(ierr); 2119c80a6c00SStefano Zampini for (a = 0; a < adjSize; ++a) { 2120c80a6c00SStefano Zampini const PetscInt point = adj[a]; 21215cef3d0dSStefano Zampini if (pStart <= point && point < pEnd) { 2122c80a6c00SStefano Zampini PetscInt *PETSC_RESTRICT pBuf; 2123c80a6c00SStefano Zampini ierr = PetscSectionAddDof(section, p, 1);CHKERRQ(ierr); 2124c80a6c00SStefano Zampini ierr = PetscSegBufferGetInts(adjBuffer, 1, &pBuf);CHKERRQ(ierr); 2125c80a6c00SStefano Zampini *pBuf = point; 2126c80a6c00SStefano Zampini } 2127c80a6c00SStefano Zampini } 2128c80a6c00SStefano Zampini n++; 2129c80a6c00SStefano Zampini } 2130c80a6c00SStefano Zampini ierr = DMPlexSetAdjacencyUseCone(dm, useCone);CHKERRQ(ierr); 2131c80a6c00SStefano Zampini ierr = DMPlexSetAdjacencyUseClosure(dm, useClosure);CHKERRQ(ierr); 2132c80a6c00SStefano Zampini /* Derive CSR graph from section/segbuffer */ 2133c80a6c00SStefano Zampini ierr = PetscSectionSetUp(section);CHKERRQ(ierr); 2134c80a6c00SStefano Zampini ierr = PetscSectionGetStorageSize(section, &size);CHKERRQ(ierr); 2135c80a6c00SStefano Zampini ierr = PetscMalloc1(n+1, &xadj);CHKERRQ(ierr); 2136c80a6c00SStefano Zampini for (idx = 0, p = pStart; p < pEnd; p++) { 2137c80a6c00SStefano Zampini if (nroots > 0) {if (cellNum[p] < 0) continue;} 2138c80a6c00SStefano Zampini ierr = PetscSectionGetOffset(section, p, &(xadj[idx++]));CHKERRQ(ierr); 2139c80a6c00SStefano Zampini } 2140c80a6c00SStefano Zampini xadj[n] = size; 2141c80a6c00SStefano Zampini ierr = PetscSegBufferExtractAlloc(adjBuffer, &adjncy);CHKERRQ(ierr); 2142c80a6c00SStefano Zampini /* Clean up */ 2143c80a6c00SStefano Zampini ierr = PetscSegBufferDestroy(&adjBuffer);CHKERRQ(ierr); 2144c80a6c00SStefano Zampini ierr = PetscSectionDestroy(§ion);CHKERRQ(ierr); 2145c80a6c00SStefano Zampini ierr = PetscFree(adj);CHKERRQ(ierr); 2146c80a6c00SStefano Zampini graph->xadj = xadj; 2147c80a6c00SStefano Zampini 
graph->adjncy = adjncy; 2148c80a6c00SStefano Zampini } else { 2149c80a6c00SStefano Zampini Mat A; 2150c80a6c00SStefano Zampini PetscBool filter = PETSC_FALSE, isseqaij, flg_row; 2151c80a6c00SStefano Zampini 2152c80a6c00SStefano Zampini ierr = MatISGetLocalMat(pc->pmat,&A);CHKERRQ(ierr); 215363c961adSStefano Zampini if (!A->rmap->N || !A->cmap->N) { 2154a2eca866SStefano Zampini ierr = PCBDDCGraphDestroy(&graph);CHKERRQ(ierr); 215563c961adSStefano Zampini PetscFunctionReturn(0); 215663c961adSStefano Zampini } 21574f1b2e48SStefano Zampini ierr = PetscObjectTypeCompare((PetscObject)A,MATSEQAIJ,&isseqaij);CHKERRQ(ierr); 21584f1b2e48SStefano Zampini if (!isseqaij && filter) { 21591cf9b237SStefano Zampini PetscBool isseqdense; 21601cf9b237SStefano Zampini 21611cf9b237SStefano Zampini ierr = PetscObjectTypeCompare((PetscObject)A,MATSEQDENSE,&isseqdense);CHKERRQ(ierr); 21621cf9b237SStefano Zampini if (!isseqdense) { 21634f1b2e48SStefano Zampini ierr = MatConvert(A,MATSEQAIJ,MAT_INITIAL_MATRIX,&B);CHKERRQ(ierr); 21641cf9b237SStefano Zampini } else { /* TODO: rectangular case and LDA */ 21651cf9b237SStefano Zampini PetscScalar *array; 21661cf9b237SStefano Zampini PetscReal chop=1.e-6; 21671cf9b237SStefano Zampini 21681cf9b237SStefano Zampini ierr = MatDuplicate(A,MAT_COPY_VALUES,&B);CHKERRQ(ierr); 21691cf9b237SStefano Zampini ierr = MatDenseGetArray(B,&array);CHKERRQ(ierr); 21701cf9b237SStefano Zampini ierr = MatGetSize(B,&n,NULL);CHKERRQ(ierr); 21711cf9b237SStefano Zampini for (i=0;i<n;i++) { 21721cf9b237SStefano Zampini PetscInt j; 21731cf9b237SStefano Zampini for (j=i+1;j<n;j++) { 21741cf9b237SStefano Zampini PetscReal thresh = chop*(PetscAbsScalar(array[i*(n+1)])+PetscAbsScalar(array[j*(n+1)])); 21751cf9b237SStefano Zampini if (PetscAbsScalar(array[i*n+j]) < thresh) array[i*n+j] = 0.; 21761cf9b237SStefano Zampini if (PetscAbsScalar(array[j*n+i]) < thresh) array[j*n+i] = 0.; 21771cf9b237SStefano Zampini } 21781cf9b237SStefano Zampini } 21791cf9b237SStefano Zampini ierr = 
MatDenseRestoreArray(B,&array);CHKERRQ(ierr); 21809d54b7f4SStefano Zampini ierr = MatConvert(B,MATSEQAIJ,MAT_INPLACE_MATRIX,&B);CHKERRQ(ierr); 21811cf9b237SStefano Zampini } 21824f1b2e48SStefano Zampini } else { 2183c80a6c00SStefano Zampini ierr = PetscObjectReference((PetscObject)A);CHKERRQ(ierr); 21844f1b2e48SStefano Zampini B = A; 21854f1b2e48SStefano Zampini } 21864f1b2e48SStefano Zampini ierr = MatGetRowIJ(B,0,PETSC_TRUE,PETSC_FALSE,&n,(const PetscInt**)&xadj,(const PetscInt**)&adjncy,&flg_row);CHKERRQ(ierr); 21874f1b2e48SStefano Zampini 21884f1b2e48SStefano Zampini /* if filter is true, then removes entries lower than PETSC_SMALL in magnitude */ 21894f1b2e48SStefano Zampini if (filter) { 21904f1b2e48SStefano Zampini PetscScalar *data; 21914f1b2e48SStefano Zampini PetscInt j,cum; 21924f1b2e48SStefano Zampini 21934f1b2e48SStefano Zampini ierr = PetscCalloc2(n+1,&xadj_filtered,xadj[n],&adjncy_filtered);CHKERRQ(ierr); 21944f1b2e48SStefano Zampini ierr = MatSeqAIJGetArray(B,&data);CHKERRQ(ierr); 21954f1b2e48SStefano Zampini cum = 0; 21964f1b2e48SStefano Zampini for (i=0;i<n;i++) { 21974f1b2e48SStefano Zampini PetscInt t; 21984f1b2e48SStefano Zampini 21994f1b2e48SStefano Zampini for (j=xadj[i];j<xadj[i+1];j++) { 22004f1b2e48SStefano Zampini if (PetscUnlikely(PetscAbsScalar(data[j]) < PETSC_SMALL)) { 22014f1b2e48SStefano Zampini continue; 22024f1b2e48SStefano Zampini } 22034f1b2e48SStefano Zampini adjncy_filtered[cum+xadj_filtered[i]++] = adjncy[j]; 22044f1b2e48SStefano Zampini } 22054f1b2e48SStefano Zampini t = xadj_filtered[i]; 22064f1b2e48SStefano Zampini xadj_filtered[i] = cum; 22074f1b2e48SStefano Zampini cum += t; 22084f1b2e48SStefano Zampini } 22094f1b2e48SStefano Zampini ierr = MatSeqAIJRestoreArray(B,&data);CHKERRQ(ierr); 22104f1b2e48SStefano Zampini graph->xadj = xadj_filtered; 22114f1b2e48SStefano Zampini graph->adjncy = adjncy_filtered; 22124f1b2e48SStefano Zampini } else { 22134f1b2e48SStefano Zampini graph->xadj = xadj; 22144f1b2e48SStefano Zampini 
graph->adjncy = adjncy; 22154f1b2e48SStefano Zampini } 2216c80a6c00SStefano Zampini } 2217c80a6c00SStefano Zampini /* compute local connected components using PCBDDCGraph */ 2218c80a6c00SStefano Zampini ierr = ISCreateStride(PETSC_COMM_SELF,n,0,1,&is_dummy);CHKERRQ(ierr); 2219c80a6c00SStefano Zampini ierr = ISLocalToGlobalMappingCreateIS(is_dummy,&l2gmap_dummy);CHKERRQ(ierr); 2220c80a6c00SStefano Zampini ierr = ISDestroy(&is_dummy);CHKERRQ(ierr); 2221c80a6c00SStefano Zampini ierr = PCBDDCGraphInit(graph,l2gmap_dummy,n,PETSC_MAX_INT);CHKERRQ(ierr); 2222c80a6c00SStefano Zampini ierr = ISLocalToGlobalMappingDestroy(&l2gmap_dummy);CHKERRQ(ierr); 22234f1b2e48SStefano Zampini ierr = PCBDDCGraphSetUp(graph,1,NULL,NULL,0,NULL,NULL);CHKERRQ(ierr); 22244f1b2e48SStefano Zampini ierr = PCBDDCGraphComputeConnectedComponents(graph);CHKERRQ(ierr); 2225c80a6c00SStefano Zampini 22264f1b2e48SStefano Zampini /* partial clean up */ 22274f1b2e48SStefano Zampini ierr = PetscFree2(xadj_filtered,adjncy_filtered);CHKERRQ(ierr); 2228c80a6c00SStefano Zampini if (B) { 2229c80a6c00SStefano Zampini PetscBool flg_row; 22304f1b2e48SStefano Zampini ierr = MatRestoreRowIJ(B,0,PETSC_TRUE,PETSC_FALSE,&n,(const PetscInt**)&xadj,(const PetscInt**)&adjncy,&flg_row);CHKERRQ(ierr); 22314f1b2e48SStefano Zampini ierr = MatDestroy(&B);CHKERRQ(ierr); 22324f1b2e48SStefano Zampini } 2233c80a6c00SStefano Zampini if (isplex) { 2234c80a6c00SStefano Zampini ierr = PetscFree(xadj);CHKERRQ(ierr); 2235c80a6c00SStefano Zampini ierr = PetscFree(adjncy);CHKERRQ(ierr); 2236c80a6c00SStefano Zampini } 22374f1b2e48SStefano Zampini 22384f1b2e48SStefano Zampini /* get back data */ 2239c80a6c00SStefano Zampini if (isplex) { 2240c80a6c00SStefano Zampini if (ncc) *ncc = graph->ncc; 2241c80a6c00SStefano Zampini if (cc || primalv) { 2242c80a6c00SStefano Zampini Mat A; 2243c80a6c00SStefano Zampini PetscBT btv,btvt; 2244c80a6c00SStefano Zampini PetscSection subSection; 2245c80a6c00SStefano Zampini PetscInt *ids,cum,cump,*cids,*pids; 
2246c80a6c00SStefano Zampini 2247c80a6c00SStefano Zampini ierr = DMPlexGetSubdomainSection(dm,&subSection);CHKERRQ(ierr); 2248c80a6c00SStefano Zampini ierr = MatISGetLocalMat(pc->pmat,&A);CHKERRQ(ierr); 2249c80a6c00SStefano Zampini ierr = PetscMalloc3(A->rmap->n,&ids,graph->ncc+1,&cids,A->rmap->n,&pids);CHKERRQ(ierr); 2250c80a6c00SStefano Zampini ierr = PetscBTCreate(A->rmap->n,&btv);CHKERRQ(ierr); 2251c80a6c00SStefano Zampini ierr = PetscBTCreate(A->rmap->n,&btvt);CHKERRQ(ierr); 2252c80a6c00SStefano Zampini 2253c80a6c00SStefano Zampini cids[0] = 0; 2254c80a6c00SStefano Zampini for (i = 0, cump = 0, cum = 0; i < graph->ncc; i++) { 2255c80a6c00SStefano Zampini PetscInt j; 2256c80a6c00SStefano Zampini 2257c80a6c00SStefano Zampini ierr = PetscBTMemzero(A->rmap->n,btvt);CHKERRQ(ierr); 2258c80a6c00SStefano Zampini for (j = graph->cptr[i]; j < graph->cptr[i+1]; j++) { 2259c80a6c00SStefano Zampini PetscInt k, size, *closure = NULL, cell = graph->queue[j]; 2260c80a6c00SStefano Zampini 2261c80a6c00SStefano Zampini ierr = DMPlexGetTransitiveClosure(dm,cell,PETSC_TRUE,&size,&closure);CHKERRQ(ierr); 2262c80a6c00SStefano Zampini for (k = 0; k < 2*size; k += 2) { 2263c80a6c00SStefano Zampini PetscInt s, p = closure[k], off, dof, cdof; 2264c80a6c00SStefano Zampini 2265c80a6c00SStefano Zampini ierr = PetscSectionGetConstraintDof(subSection, p, &cdof);CHKERRQ(ierr); 2266c80a6c00SStefano Zampini ierr = PetscSectionGetOffset(subSection,p,&off);CHKERRQ(ierr); 2267c80a6c00SStefano Zampini ierr = PetscSectionGetDof(subSection,p,&dof);CHKERRQ(ierr); 2268c80a6c00SStefano Zampini for (s = 0; s < dof-cdof; s++) { 2269c80a6c00SStefano Zampini if (PetscBTLookupSet(btvt,off+s)) continue; 2270c80a6c00SStefano Zampini if (!PetscBTLookup(btv,off+s)) { 2271c80a6c00SStefano Zampini ids[cum++] = off+s; 2272c80a6c00SStefano Zampini } else { /* cross-vertex */ 2273c80a6c00SStefano Zampini pids[cump++] = off+s; 2274c80a6c00SStefano Zampini } 2275c80a6c00SStefano Zampini } 2276c80a6c00SStefano Zampini } 
2277c80a6c00SStefano Zampini ierr = DMPlexRestoreTransitiveClosure(dm,cell,PETSC_TRUE,&size,&closure);CHKERRQ(ierr); 2278c80a6c00SStefano Zampini } 2279c80a6c00SStefano Zampini cids[i+1] = cum; 2280c80a6c00SStefano Zampini /* mark dofs as already assigned */ 2281c80a6c00SStefano Zampini for (j = cids[i]; j < cids[i+1]; j++) { 2282c80a6c00SStefano Zampini ierr = PetscBTSet(btv,ids[j]);CHKERRQ(ierr); 2283c80a6c00SStefano Zampini } 2284c80a6c00SStefano Zampini } 2285c80a6c00SStefano Zampini if (cc) { 2286c80a6c00SStefano Zampini ierr = PetscMalloc1(graph->ncc,&cc_n);CHKERRQ(ierr); 2287c80a6c00SStefano Zampini for (i = 0; i < graph->ncc; i++) { 2288c80a6c00SStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,cids[i+1]-cids[i],ids+cids[i],PETSC_COPY_VALUES,&cc_n[i]);CHKERRQ(ierr); 2289c80a6c00SStefano Zampini } 2290c80a6c00SStefano Zampini *cc = cc_n; 2291c80a6c00SStefano Zampini } 2292c80a6c00SStefano Zampini if (primalv) { 2293c80a6c00SStefano Zampini ierr = ISCreateGeneral(PetscObjectComm((PetscObject)pc),cump,pids,PETSC_COPY_VALUES,primalv);CHKERRQ(ierr); 2294c80a6c00SStefano Zampini } 2295c80a6c00SStefano Zampini ierr = PetscFree3(ids,cids,pids);CHKERRQ(ierr); 2296c80a6c00SStefano Zampini ierr = PetscBTDestroy(&btv);CHKERRQ(ierr); 2297c80a6c00SStefano Zampini ierr = PetscBTDestroy(&btvt);CHKERRQ(ierr); 2298c80a6c00SStefano Zampini } 2299c80a6c00SStefano Zampini } else { 23001cf9b237SStefano Zampini if (ncc) *ncc = graph->ncc; 23011cf9b237SStefano Zampini if (cc) { 23024f1b2e48SStefano Zampini ierr = PetscMalloc1(graph->ncc,&cc_n);CHKERRQ(ierr); 23034f1b2e48SStefano Zampini for (i=0;i<graph->ncc;i++) { 23044f1b2e48SStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,graph->cptr[i+1]-graph->cptr[i],graph->queue+graph->cptr[i],PETSC_COPY_VALUES,&cc_n[i]);CHKERRQ(ierr); 23054f1b2e48SStefano Zampini } 23064f1b2e48SStefano Zampini *cc = cc_n; 23071cf9b237SStefano Zampini } 2308c80a6c00SStefano Zampini } 23094f1b2e48SStefano Zampini /* clean up graph */ 
23104f1b2e48SStefano Zampini graph->xadj = 0; 23114f1b2e48SStefano Zampini graph->adjncy = 0; 23124f1b2e48SStefano Zampini ierr = PCBDDCGraphDestroy(&graph);CHKERRQ(ierr); 23134f1b2e48SStefano Zampini PetscFunctionReturn(0); 23144f1b2e48SStefano Zampini } 23154f1b2e48SStefano Zampini 23165408967cSStefano Zampini PetscErrorCode PCBDDCBenignCheck(PC pc, IS zerodiag) 23175408967cSStefano Zampini { 23185408967cSStefano Zampini PC_BDDC* pcbddc = (PC_BDDC*)pc->data; 23195408967cSStefano Zampini PC_IS* pcis = (PC_IS*)(pc->data); 2320dee84bffSStefano Zampini IS dirIS = NULL; 23214f1b2e48SStefano Zampini PetscInt i; 23225408967cSStefano Zampini PetscErrorCode ierr; 23235408967cSStefano Zampini 23245408967cSStefano Zampini PetscFunctionBegin; 2325dee84bffSStefano Zampini ierr = PCBDDCGraphGetDirichletDofs(pcbddc->mat_graph,&dirIS);CHKERRQ(ierr); 23265408967cSStefano Zampini if (zerodiag) { 23275408967cSStefano Zampini Mat A; 23285408967cSStefano Zampini Vec vec3_N; 23295408967cSStefano Zampini PetscScalar *vals; 23305408967cSStefano Zampini const PetscInt *idxs; 2331d12d3064SStefano Zampini PetscInt nz,*count; 23325408967cSStefano Zampini 23335408967cSStefano Zampini /* p0 */ 23345408967cSStefano Zampini ierr = VecSet(pcis->vec1_N,0.);CHKERRQ(ierr); 23355408967cSStefano Zampini ierr = PetscMalloc1(pcis->n,&vals);CHKERRQ(ierr); 23365408967cSStefano Zampini ierr = ISGetLocalSize(zerodiag,&nz);CHKERRQ(ierr); 23375408967cSStefano Zampini ierr = ISGetIndices(zerodiag,&idxs);CHKERRQ(ierr); 23384f1b2e48SStefano Zampini for (i=0;i<nz;i++) vals[i] = 1.; 23395408967cSStefano Zampini ierr = VecSetValues(pcis->vec1_N,nz,idxs,vals,INSERT_VALUES);CHKERRQ(ierr); 23405408967cSStefano Zampini ierr = VecAssemblyBegin(pcis->vec1_N);CHKERRQ(ierr); 23415408967cSStefano Zampini ierr = VecAssemblyEnd(pcis->vec1_N);CHKERRQ(ierr); 23425408967cSStefano Zampini /* v_I */ 23435408967cSStefano Zampini ierr = VecSetRandom(pcis->vec2_N,NULL);CHKERRQ(ierr); 23445408967cSStefano Zampini for (i=0;i<nz;i++) 
vals[i] = 0.; 23455408967cSStefano Zampini ierr = VecSetValues(pcis->vec2_N,nz,idxs,vals,INSERT_VALUES);CHKERRQ(ierr); 23465408967cSStefano Zampini ierr = ISRestoreIndices(zerodiag,&idxs);CHKERRQ(ierr); 23475408967cSStefano Zampini ierr = ISGetIndices(pcis->is_B_local,&idxs);CHKERRQ(ierr); 23485408967cSStefano Zampini for (i=0;i<pcis->n_B;i++) vals[i] = 0.; 23495408967cSStefano Zampini ierr = VecSetValues(pcis->vec2_N,pcis->n_B,idxs,vals,INSERT_VALUES);CHKERRQ(ierr); 23505408967cSStefano Zampini ierr = ISRestoreIndices(pcis->is_B_local,&idxs);CHKERRQ(ierr); 23515408967cSStefano Zampini if (dirIS) { 23525408967cSStefano Zampini PetscInt n; 23535408967cSStefano Zampini 23545408967cSStefano Zampini ierr = ISGetLocalSize(dirIS,&n);CHKERRQ(ierr); 23555408967cSStefano Zampini ierr = ISGetIndices(dirIS,&idxs);CHKERRQ(ierr); 23565408967cSStefano Zampini for (i=0;i<n;i++) vals[i] = 0.; 23575408967cSStefano Zampini ierr = VecSetValues(pcis->vec2_N,n,idxs,vals,INSERT_VALUES);CHKERRQ(ierr); 23585408967cSStefano Zampini ierr = ISRestoreIndices(dirIS,&idxs);CHKERRQ(ierr); 23595408967cSStefano Zampini } 23605408967cSStefano Zampini ierr = VecAssemblyBegin(pcis->vec2_N);CHKERRQ(ierr); 23615408967cSStefano Zampini ierr = VecAssemblyEnd(pcis->vec2_N);CHKERRQ(ierr); 23625408967cSStefano Zampini ierr = VecDuplicate(pcis->vec1_N,&vec3_N);CHKERRQ(ierr); 23635408967cSStefano Zampini ierr = VecSet(vec3_N,0.);CHKERRQ(ierr); 2364669cc0f4SStefano Zampini ierr = MatISGetLocalMat(pc->pmat,&A);CHKERRQ(ierr); 23655408967cSStefano Zampini ierr = MatMult(A,pcis->vec1_N,vec3_N);CHKERRQ(ierr); 23665408967cSStefano Zampini ierr = VecDot(vec3_N,pcis->vec2_N,&vals[0]);CHKERRQ(ierr); 23679a962809SStefano Zampini if (PetscAbsScalar(vals[0]) > 1.e-1) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_SUP,"Benign trick can not be applied! 
b(v_I,p_0) = %1.6e (should be numerically 0.)",PetscAbsScalar(vals[0])); 23685408967cSStefano Zampini ierr = PetscFree(vals);CHKERRQ(ierr); 23695408967cSStefano Zampini ierr = VecDestroy(&vec3_N);CHKERRQ(ierr); 2370d12d3064SStefano Zampini 2371d12d3064SStefano Zampini /* there should not be any pressure dofs lying on the interface */ 2372d12d3064SStefano Zampini ierr = PetscCalloc1(pcis->n,&count);CHKERRQ(ierr); 2373d12d3064SStefano Zampini ierr = ISGetIndices(pcis->is_B_local,&idxs);CHKERRQ(ierr); 2374d12d3064SStefano Zampini for (i=0;i<pcis->n_B;i++) count[idxs[i]]++; 2375d12d3064SStefano Zampini ierr = ISRestoreIndices(pcis->is_B_local,&idxs);CHKERRQ(ierr); 2376d12d3064SStefano Zampini ierr = ISGetIndices(zerodiag,&idxs);CHKERRQ(ierr); 23779a962809SStefano Zampini for (i=0;i<nz;i++) if (count[idxs[i]]) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_SUP,"Benign trick can not be applied! pressure dof %d is an interface dof",idxs[i]); 2378d12d3064SStefano Zampini ierr = ISRestoreIndices(zerodiag,&idxs);CHKERRQ(ierr); 2379d12d3064SStefano Zampini ierr = PetscFree(count);CHKERRQ(ierr); 23805408967cSStefano Zampini } 2381dee84bffSStefano Zampini ierr = ISDestroy(&dirIS);CHKERRQ(ierr); 23825408967cSStefano Zampini 23835408967cSStefano Zampini /* check PCBDDCBenignGetOrSetP0 */ 23845408967cSStefano Zampini ierr = VecSetRandom(pcis->vec1_global,NULL);CHKERRQ(ierr); 23854f1b2e48SStefano Zampini for (i=0;i<pcbddc->benign_n;i++) pcbddc->benign_p0[i] = -PetscGlobalRank-i; 23865408967cSStefano Zampini ierr = PCBDDCBenignGetOrSetP0(pc,pcis->vec1_global,PETSC_FALSE);CHKERRQ(ierr); 23874f1b2e48SStefano Zampini for (i=0;i<pcbddc->benign_n;i++) pcbddc->benign_p0[i] = 1; 23885408967cSStefano Zampini ierr = PCBDDCBenignGetOrSetP0(pc,pcis->vec1_global,PETSC_TRUE);CHKERRQ(ierr); 2389f2a566d8SStefano Zampini for (i=0;i<pcbddc->benign_n;i++) { 2390f2a566d8SStefano Zampini PetscInt val = PetscRealPart(pcbddc->benign_p0[i]); 239113903a91SSatish Balay if (val != -PetscGlobalRank-i) 
SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Error testing PCBDDCBenignGetOrSetP0! Found %g at %d instead of %g\n",PetscRealPart(pcbddc->benign_p0[i]),i,-PetscGlobalRank-i); 2392f2a566d8SStefano Zampini } 23935408967cSStefano Zampini PetscFunctionReturn(0); 23945408967cSStefano Zampini } 23955408967cSStefano Zampini 2396339f8db1SStefano Zampini PetscErrorCode PCBDDCBenignDetectSaddlePoint(PC pc, IS *zerodiaglocal) 2397339f8db1SStefano Zampini { 2398339f8db1SStefano Zampini PC_BDDC* pcbddc = (PC_BDDC*)pc->data; 23994edc6404Sstefano_zampini IS pressures,zerodiag,zerodiag_save,*zerodiag_subs; 2400b0f5fe93SStefano Zampini PetscInt nz,n; 24014edc6404Sstefano_zampini PetscInt *interior_dofs,n_interior_dofs,nneu; 24024edc6404Sstefano_zampini PetscBool sorted,have_null,has_null_pressures,recompute_zerodiag,checkb; 2403339f8db1SStefano Zampini PetscErrorCode ierr; 2404339f8db1SStefano Zampini 2405339f8db1SStefano Zampini PetscFunctionBegin; 24069f47a83aSStefano Zampini ierr = PetscSFDestroy(&pcbddc->benign_sf);CHKERRQ(ierr); 24079f47a83aSStefano Zampini ierr = MatDestroy(&pcbddc->benign_B0);CHKERRQ(ierr); 2408a3df083aSStefano Zampini for (n=0;n<pcbddc->benign_n;n++) { 2409a3df083aSStefano Zampini ierr = ISDestroy(&pcbddc->benign_zerodiag_subs[n]);CHKERRQ(ierr); 2410a3df083aSStefano Zampini } 2411a3df083aSStefano Zampini ierr = PetscFree(pcbddc->benign_zerodiag_subs);CHKERRQ(ierr); 2412a3df083aSStefano Zampini pcbddc->benign_n = 0; 241328b8efb1Sstefano_zampini 241428b8efb1Sstefano_zampini /* if a local info on dofs is present, uses the last field for "pressures" (or fid by command line) 24154f1b2e48SStefano Zampini otherwise, it uses only zerodiagonal dofs (ok if the pressure block is all zero; it could fail if it is not) 24164f1b2e48SStefano Zampini Checks if all the pressure dofs in each subdomain have a zero diagonal 24174f1b2e48SStefano Zampini If not, a change of basis on pressures is not needed 24181ae86dd6SStefano Zampini since the local Schur complements are already SPD 
24194f1b2e48SStefano Zampini */ 24204f1b2e48SStefano Zampini has_null_pressures = PETSC_TRUE; 24214f1b2e48SStefano Zampini have_null = PETSC_TRUE; 242240fa8d13SStefano Zampini if (pcbddc->n_ISForDofsLocal) { 24237fbe2174Sstefano_zampini IS iP = NULL; 24244f1b2e48SStefano Zampini PetscInt npl,*idxs,p = pcbddc->n_ISForDofsLocal-1; 24254f1b2e48SStefano Zampini 242628b8efb1Sstefano_zampini ierr = PetscOptionsBegin(PetscObjectComm((PetscObject)pc),((PetscObject)pc)->prefix,"BDDC benign options","PC");CHKERRQ(ierr); 242728b8efb1Sstefano_zampini ierr = PetscOptionsInt("-pc_bddc_pressure_field","Field id for pressures",NULL,p,&p,NULL);CHKERRQ(ierr); 242828b8efb1Sstefano_zampini ierr = PetscOptionsEnd();CHKERRQ(ierr); 242928b8efb1Sstefano_zampini if (p < 0 || p > pcbddc->n_ISForDofsLocal-1) SETERRQ1(PetscObjectComm((PetscObject)pc),PETSC_ERR_USER,"Invalid field id for pressures %D",p); 24304f1b2e48SStefano Zampini /* Dofs splitting for BDDC cannot have PETSC_COMM_SELF, so create a sequential IS */ 24314f1b2e48SStefano Zampini ierr = ISGetLocalSize(pcbddc->ISForDofsLocal[p],&npl);CHKERRQ(ierr); 24324f1b2e48SStefano Zampini ierr = ISGetIndices(pcbddc->ISForDofsLocal[p],(const PetscInt**)&idxs);CHKERRQ(ierr); 24334f1b2e48SStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,npl,idxs,PETSC_COPY_VALUES,&pressures);CHKERRQ(ierr); 2434ba14f8e3SStefano Zampini ierr = ISRestoreIndices(pcbddc->ISForDofsLocal[p],(const PetscInt**)&idxs);CHKERRQ(ierr); 24357fbe2174Sstefano_zampini /* remove zeroed out pressures if we are setting up a BDDC solver for a saddle-point FETI-DP */ 24367fbe2174Sstefano_zampini ierr = PetscObjectQuery((PetscObject)pc,"__KSPFETIDP_lP",(PetscObject*)&iP);CHKERRQ(ierr); 24377fbe2174Sstefano_zampini if (iP) { 24387fbe2174Sstefano_zampini IS newpressures; 24397fbe2174Sstefano_zampini 24407fbe2174Sstefano_zampini ierr = ISDifference(pressures,iP,&newpressures);CHKERRQ(ierr); 24417fbe2174Sstefano_zampini ierr = ISDestroy(&pressures);CHKERRQ(ierr); 
24427fbe2174Sstefano_zampini pressures = newpressures; 24437fbe2174Sstefano_zampini } 244440fa8d13SStefano Zampini ierr = ISSorted(pressures,&sorted);CHKERRQ(ierr); 244540fa8d13SStefano Zampini if (!sorted) { 244640fa8d13SStefano Zampini ierr = ISSort(pressures);CHKERRQ(ierr); 244740fa8d13SStefano Zampini } 244840fa8d13SStefano Zampini } else { 244940fa8d13SStefano Zampini pressures = NULL; 245040fa8d13SStefano Zampini } 245197d764eeSStefano Zampini /* pcis has not been setup yet, so get the local size from the subdomain matrix */ 245297d764eeSStefano Zampini ierr = MatGetLocalSize(pcbddc->local_mat,&n,NULL);CHKERRQ(ierr); 245327b6a85dSStefano Zampini if (!n) pcbddc->benign_change_explicit = PETSC_TRUE; 245497d764eeSStefano Zampini ierr = MatFindZeroDiagonals(pcbddc->local_mat,&zerodiag);CHKERRQ(ierr); 2455339f8db1SStefano Zampini ierr = ISSorted(zerodiag,&sorted);CHKERRQ(ierr); 2456339f8db1SStefano Zampini if (!sorted) { 2457339f8db1SStefano Zampini ierr = ISSort(zerodiag);CHKERRQ(ierr); 2458339f8db1SStefano Zampini } 24594edc6404Sstefano_zampini ierr = PetscObjectReference((PetscObject)zerodiag);CHKERRQ(ierr); 24604edc6404Sstefano_zampini zerodiag_save = zerodiag; 2461339f8db1SStefano Zampini ierr = ISGetLocalSize(zerodiag,&nz);CHKERRQ(ierr); 24624f1b2e48SStefano Zampini if (!nz) { 24634f1b2e48SStefano Zampini if (n) have_null = PETSC_FALSE; 24644f1b2e48SStefano Zampini has_null_pressures = PETSC_FALSE; 246540fa8d13SStefano Zampini ierr = ISDestroy(&zerodiag);CHKERRQ(ierr); 246640fa8d13SStefano Zampini } 24674f1b2e48SStefano Zampini recompute_zerodiag = PETSC_FALSE; 24684f1b2e48SStefano Zampini /* in case disconnected subdomains info is present, split the pressures accordingly (otherwise the benign trick could fail) */ 24694f1b2e48SStefano Zampini zerodiag_subs = NULL; 24704f1b2e48SStefano Zampini pcbddc->benign_n = 0; 24711f4df5f7SStefano Zampini n_interior_dofs = 0; 24721f4df5f7SStefano Zampini interior_dofs = NULL; 24734edc6404Sstefano_zampini nneu = 0; 
24744edc6404Sstefano_zampini if (pcbddc->NeumannBoundariesLocal) { 24754edc6404Sstefano_zampini ierr = ISGetLocalSize(pcbddc->NeumannBoundariesLocal,&nneu);CHKERRQ(ierr); 24764edc6404Sstefano_zampini } 24773369cb78Sstefano_zampini checkb = (PetscBool)(!pcbddc->NeumannBoundariesLocal || pcbddc->current_level); 24784edc6404Sstefano_zampini if (checkb) { /* need to compute interior nodes */ 24791f4df5f7SStefano Zampini PetscInt n,i,j; 24801f4df5f7SStefano Zampini PetscInt n_neigh,*neigh,*n_shared,**shared; 24811f4df5f7SStefano Zampini PetscInt *iwork; 24821f4df5f7SStefano Zampini 24831f4df5f7SStefano Zampini ierr = ISLocalToGlobalMappingGetSize(pc->pmat->rmap->mapping,&n);CHKERRQ(ierr); 24841f4df5f7SStefano Zampini ierr = ISLocalToGlobalMappingGetInfo(pc->pmat->rmap->mapping,&n_neigh,&neigh,&n_shared,&shared);CHKERRQ(ierr); 24851f4df5f7SStefano Zampini ierr = PetscCalloc1(n,&iwork);CHKERRQ(ierr); 24861f4df5f7SStefano Zampini ierr = PetscMalloc1(n,&interior_dofs);CHKERRQ(ierr); 248790648384SStefano Zampini for (i=1;i<n_neigh;i++) 24881f4df5f7SStefano Zampini for (j=0;j<n_shared[i];j++) 24891f4df5f7SStefano Zampini iwork[shared[i][j]] += 1; 24901f4df5f7SStefano Zampini for (i=0;i<n;i++) 24911f4df5f7SStefano Zampini if (!iwork[i]) 24921f4df5f7SStefano Zampini interior_dofs[n_interior_dofs++] = i; 24931f4df5f7SStefano Zampini ierr = PetscFree(iwork);CHKERRQ(ierr); 24941f4df5f7SStefano Zampini ierr = ISLocalToGlobalMappingRestoreInfo(pc->pmat->rmap->mapping,&n_neigh,&neigh,&n_shared,&shared);CHKERRQ(ierr); 24951f4df5f7SStefano Zampini } 24964f1b2e48SStefano Zampini if (has_null_pressures) { 24974f1b2e48SStefano Zampini IS *subs; 24984edc6404Sstefano_zampini PetscInt nsubs,i,j,nl; 24991f4df5f7SStefano Zampini const PetscInt *idxs; 25001f4df5f7SStefano Zampini PetscScalar *array; 25011f4df5f7SStefano Zampini Vec *work; 25021f4df5f7SStefano Zampini Mat_IS* matis = (Mat_IS*)(pc->pmat->data); 25034f1b2e48SStefano Zampini 25044f1b2e48SStefano Zampini subs = pcbddc->local_subs; 
25054f1b2e48SStefano Zampini nsubs = pcbddc->n_local_subs; 25061f4df5f7SStefano Zampini /* these vectors are needed to check if the constant on pressures is in the kernel of the local operator B (i.e. B(v_I,p0) should be zero) */ 25074edc6404Sstefano_zampini if (checkb) { 25081f4df5f7SStefano Zampini ierr = VecDuplicateVecs(matis->y,2,&work);CHKERRQ(ierr); 25091f4df5f7SStefano Zampini ierr = ISGetLocalSize(zerodiag,&nl);CHKERRQ(ierr); 25101f4df5f7SStefano Zampini ierr = ISGetIndices(zerodiag,&idxs);CHKERRQ(ierr); 25111f4df5f7SStefano Zampini /* work[0] = 1_p */ 25121f4df5f7SStefano Zampini ierr = VecSet(work[0],0.);CHKERRQ(ierr); 25131f4df5f7SStefano Zampini ierr = VecGetArray(work[0],&array);CHKERRQ(ierr); 25141f4df5f7SStefano Zampini for (j=0;j<nl;j++) array[idxs[j]] = 1.; 25151f4df5f7SStefano Zampini ierr = VecRestoreArray(work[0],&array);CHKERRQ(ierr); 25161f4df5f7SStefano Zampini /* work[0] = 1_v */ 25171f4df5f7SStefano Zampini ierr = VecSet(work[1],1.);CHKERRQ(ierr); 25181f4df5f7SStefano Zampini ierr = VecGetArray(work[1],&array);CHKERRQ(ierr); 25191f4df5f7SStefano Zampini for (j=0;j<nl;j++) array[idxs[j]] = 0.; 25201f4df5f7SStefano Zampini ierr = VecRestoreArray(work[1],&array);CHKERRQ(ierr); 25211f4df5f7SStefano Zampini ierr = ISRestoreIndices(zerodiag,&idxs);CHKERRQ(ierr); 25221f4df5f7SStefano Zampini } 25234f1b2e48SStefano Zampini if (nsubs > 1) { 25244f1b2e48SStefano Zampini ierr = PetscCalloc1(nsubs,&zerodiag_subs);CHKERRQ(ierr); 25254f1b2e48SStefano Zampini for (i=0;i<nsubs;i++) { 25264f1b2e48SStefano Zampini ISLocalToGlobalMapping l2g; 25274f1b2e48SStefano Zampini IS t_zerodiag_subs; 25284f1b2e48SStefano Zampini PetscInt nl; 25294f1b2e48SStefano Zampini 25304f1b2e48SStefano Zampini ierr = ISLocalToGlobalMappingCreateIS(subs[i],&l2g);CHKERRQ(ierr); 25314f1b2e48SStefano Zampini ierr = ISGlobalToLocalMappingApplyIS(l2g,IS_GTOLM_DROP,zerodiag,&t_zerodiag_subs);CHKERRQ(ierr); 25324f1b2e48SStefano Zampini ierr = 
ISGetLocalSize(t_zerodiag_subs,&nl);CHKERRQ(ierr); 25334f1b2e48SStefano Zampini if (nl) { 25344f1b2e48SStefano Zampini PetscBool valid = PETSC_TRUE; 25354f1b2e48SStefano Zampini 25364edc6404Sstefano_zampini if (checkb) { 25371f4df5f7SStefano Zampini ierr = VecSet(matis->x,0);CHKERRQ(ierr); 25381f4df5f7SStefano Zampini ierr = ISGetLocalSize(subs[i],&nl);CHKERRQ(ierr); 25391f4df5f7SStefano Zampini ierr = ISGetIndices(subs[i],&idxs);CHKERRQ(ierr); 25401f4df5f7SStefano Zampini ierr = VecGetArray(matis->x,&array);CHKERRQ(ierr); 25411f4df5f7SStefano Zampini for (j=0;j<nl;j++) array[idxs[j]] = 1.; 25421f4df5f7SStefano Zampini ierr = VecRestoreArray(matis->x,&array);CHKERRQ(ierr); 25431f4df5f7SStefano Zampini ierr = ISRestoreIndices(subs[i],&idxs);CHKERRQ(ierr); 25441f4df5f7SStefano Zampini ierr = VecPointwiseMult(matis->x,work[0],matis->x);CHKERRQ(ierr); 25451f4df5f7SStefano Zampini ierr = MatMult(matis->A,matis->x,matis->y);CHKERRQ(ierr); 25461f4df5f7SStefano Zampini ierr = VecPointwiseMult(matis->y,work[1],matis->y);CHKERRQ(ierr); 25471f4df5f7SStefano Zampini ierr = VecGetArray(matis->y,&array);CHKERRQ(ierr); 25481f4df5f7SStefano Zampini for (j=0;j<n_interior_dofs;j++) { 25491f4df5f7SStefano Zampini if (PetscAbsScalar(array[interior_dofs[j]]) > PETSC_SMALL) { 25501f4df5f7SStefano Zampini valid = PETSC_FALSE; 25511f4df5f7SStefano Zampini break; 25521f4df5f7SStefano Zampini } 25531f4df5f7SStefano Zampini } 25541f4df5f7SStefano Zampini ierr = VecRestoreArray(matis->y,&array);CHKERRQ(ierr); 25551f4df5f7SStefano Zampini } 25566632bad2Sstefano_zampini if (valid && nneu) { 25576632bad2Sstefano_zampini const PetscInt *idxs; 25581f4df5f7SStefano Zampini PetscInt nzb; 25591f4df5f7SStefano Zampini 25606632bad2Sstefano_zampini ierr = ISGetIndices(pcbddc->NeumannBoundariesLocal,&idxs);CHKERRQ(ierr); 25616632bad2Sstefano_zampini ierr = ISGlobalToLocalMappingApply(l2g,IS_GTOLM_DROP,nneu,idxs,&nzb,NULL);CHKERRQ(ierr); 25626632bad2Sstefano_zampini ierr = 
ISRestoreIndices(pcbddc->NeumannBoundariesLocal,&idxs);CHKERRQ(ierr); 25631f4df5f7SStefano Zampini if (nzb) valid = PETSC_FALSE; 25641f4df5f7SStefano Zampini } 25651f4df5f7SStefano Zampini if (valid && pressures) { 25664f1b2e48SStefano Zampini IS t_pressure_subs; 25674f1b2e48SStefano Zampini ierr = ISGlobalToLocalMappingApplyIS(l2g,IS_GTOLM_DROP,pressures,&t_pressure_subs);CHKERRQ(ierr); 25684f1b2e48SStefano Zampini ierr = ISEqual(t_pressure_subs,t_zerodiag_subs,&valid);CHKERRQ(ierr); 25694f1b2e48SStefano Zampini ierr = ISDestroy(&t_pressure_subs);CHKERRQ(ierr); 25704f1b2e48SStefano Zampini } 25714f1b2e48SStefano Zampini if (valid) { 25724f1b2e48SStefano Zampini ierr = ISLocalToGlobalMappingApplyIS(l2g,t_zerodiag_subs,&zerodiag_subs[pcbddc->benign_n]);CHKERRQ(ierr); 25734f1b2e48SStefano Zampini pcbddc->benign_n++; 25744f1b2e48SStefano Zampini } else { 25754f1b2e48SStefano Zampini recompute_zerodiag = PETSC_TRUE; 25764f1b2e48SStefano Zampini } 25774f1b2e48SStefano Zampini } 25784f1b2e48SStefano Zampini ierr = ISDestroy(&t_zerodiag_subs);CHKERRQ(ierr); 25794f1b2e48SStefano Zampini ierr = ISLocalToGlobalMappingDestroy(&l2g);CHKERRQ(ierr); 25804f1b2e48SStefano Zampini } 25814f1b2e48SStefano Zampini } else { /* there's just one subdomain (or zero if they have not been detected */ 25824f1b2e48SStefano Zampini PetscBool valid = PETSC_TRUE; 25831f4df5f7SStefano Zampini 25846632bad2Sstefano_zampini if (nneu) valid = PETSC_FALSE; 25851f4df5f7SStefano Zampini if (valid && pressures) { 25864f1b2e48SStefano Zampini ierr = ISEqual(pressures,zerodiag,&valid);CHKERRQ(ierr); 25874f1b2e48SStefano Zampini } 25884edc6404Sstefano_zampini if (valid && checkb) { 25891f4df5f7SStefano Zampini ierr = MatMult(matis->A,work[0],matis->x);CHKERRQ(ierr); 25901f4df5f7SStefano Zampini ierr = VecPointwiseMult(matis->x,work[1],matis->x);CHKERRQ(ierr); 25911f4df5f7SStefano Zampini ierr = VecGetArray(matis->x,&array);CHKERRQ(ierr); 25921f4df5f7SStefano Zampini for (j=0;j<n_interior_dofs;j++) { 
25931f4df5f7SStefano Zampini if (PetscAbsScalar(array[interior_dofs[j]]) > PETSC_SMALL) { 25941f4df5f7SStefano Zampini valid = PETSC_FALSE; 25951f4df5f7SStefano Zampini break; 25961f4df5f7SStefano Zampini } 25971f4df5f7SStefano Zampini } 25981f4df5f7SStefano Zampini ierr = VecRestoreArray(matis->x,&array);CHKERRQ(ierr); 25991f4df5f7SStefano Zampini } 26004f1b2e48SStefano Zampini if (valid) { 26014f1b2e48SStefano Zampini pcbddc->benign_n = 1; 2602ca92afb2SStefano Zampini ierr = PetscMalloc1(pcbddc->benign_n,&zerodiag_subs);CHKERRQ(ierr); 26034f1b2e48SStefano Zampini ierr = PetscObjectReference((PetscObject)zerodiag);CHKERRQ(ierr); 26044f1b2e48SStefano Zampini zerodiag_subs[0] = zerodiag; 26054f1b2e48SStefano Zampini } 26064f1b2e48SStefano Zampini } 26074edc6404Sstefano_zampini if (checkb) { 26081f4df5f7SStefano Zampini ierr = VecDestroyVecs(2,&work);CHKERRQ(ierr); 26094f1b2e48SStefano Zampini } 26101f4df5f7SStefano Zampini } 26111f4df5f7SStefano Zampini ierr = PetscFree(interior_dofs);CHKERRQ(ierr); 26124f1b2e48SStefano Zampini 26134f1b2e48SStefano Zampini if (!pcbddc->benign_n) { 2614b9b0e38cSStefano Zampini PetscInt n; 2615b9b0e38cSStefano Zampini 26164f1b2e48SStefano Zampini ierr = ISDestroy(&zerodiag);CHKERRQ(ierr); 26174f1b2e48SStefano Zampini recompute_zerodiag = PETSC_FALSE; 2618b9b0e38cSStefano Zampini ierr = MatGetLocalSize(pcbddc->local_mat,&n,NULL);CHKERRQ(ierr); 2619b9b0e38cSStefano Zampini if (n) { 26204f1b2e48SStefano Zampini has_null_pressures = PETSC_FALSE; 26214f1b2e48SStefano Zampini have_null = PETSC_FALSE; 26224f1b2e48SStefano Zampini } 2623b9b0e38cSStefano Zampini } 26244f1b2e48SStefano Zampini 26254f1b2e48SStefano Zampini /* final check for null pressures */ 26264f1b2e48SStefano Zampini if (zerodiag && pressures) { 26274f1b2e48SStefano Zampini PetscInt nz,np; 26284f1b2e48SStefano Zampini ierr = ISGetLocalSize(zerodiag,&nz);CHKERRQ(ierr); 26294f1b2e48SStefano Zampini ierr = ISGetLocalSize(pressures,&np);CHKERRQ(ierr); 26304f1b2e48SStefano 
Zampini if (nz != np) have_null = PETSC_FALSE; 26314f1b2e48SStefano Zampini } 26324f1b2e48SStefano Zampini 26334f1b2e48SStefano Zampini if (recompute_zerodiag) { 26344f1b2e48SStefano Zampini ierr = ISDestroy(&zerodiag);CHKERRQ(ierr); 26354f1b2e48SStefano Zampini if (pcbddc->benign_n == 1) { 26364f1b2e48SStefano Zampini ierr = PetscObjectReference((PetscObject)zerodiag_subs[0]);CHKERRQ(ierr); 26374f1b2e48SStefano Zampini zerodiag = zerodiag_subs[0]; 26384f1b2e48SStefano Zampini } else { 26394f1b2e48SStefano Zampini PetscInt i,nzn,*new_idxs; 26404f1b2e48SStefano Zampini 26414f1b2e48SStefano Zampini nzn = 0; 26424f1b2e48SStefano Zampini for (i=0;i<pcbddc->benign_n;i++) { 26434f1b2e48SStefano Zampini PetscInt ns; 26444f1b2e48SStefano Zampini ierr = ISGetLocalSize(zerodiag_subs[i],&ns);CHKERRQ(ierr); 26454f1b2e48SStefano Zampini nzn += ns; 26464f1b2e48SStefano Zampini } 26474f1b2e48SStefano Zampini ierr = PetscMalloc1(nzn,&new_idxs);CHKERRQ(ierr); 26484f1b2e48SStefano Zampini nzn = 0; 26494f1b2e48SStefano Zampini for (i=0;i<pcbddc->benign_n;i++) { 26504f1b2e48SStefano Zampini PetscInt ns,*idxs; 26514f1b2e48SStefano Zampini ierr = ISGetLocalSize(zerodiag_subs[i],&ns);CHKERRQ(ierr); 26524f1b2e48SStefano Zampini ierr = ISGetIndices(zerodiag_subs[i],(const PetscInt**)&idxs);CHKERRQ(ierr); 26534f1b2e48SStefano Zampini ierr = PetscMemcpy(new_idxs+nzn,idxs,ns*sizeof(PetscInt));CHKERRQ(ierr); 26544f1b2e48SStefano Zampini ierr = ISRestoreIndices(zerodiag_subs[i],(const PetscInt**)&idxs);CHKERRQ(ierr); 26554f1b2e48SStefano Zampini nzn += ns; 26564f1b2e48SStefano Zampini } 26574f1b2e48SStefano Zampini ierr = PetscSortInt(nzn,new_idxs);CHKERRQ(ierr); 26584f1b2e48SStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,nzn,new_idxs,PETSC_OWN_POINTER,&zerodiag);CHKERRQ(ierr); 26594f1b2e48SStefano Zampini } 26604f1b2e48SStefano Zampini have_null = PETSC_FALSE; 26614f1b2e48SStefano Zampini } 26624f1b2e48SStefano Zampini 2663669cc0f4SStefano Zampini /* Prepare matrix to compute 
no-net-flux */ 2664a198735bSStefano Zampini if (pcbddc->compute_nonetflux && !pcbddc->divudotp) { 2665a198735bSStefano Zampini Mat A,loc_divudotp; 2666a198735bSStefano Zampini ISLocalToGlobalMapping rl2g,cl2g,l2gmap; 2667a198735bSStefano Zampini IS row,col,isused = NULL; 2668a198735bSStefano Zampini PetscInt M,N,n,st,n_isused; 2669a198735bSStefano Zampini 26701f4df5f7SStefano Zampini if (pressures) { 26711f4df5f7SStefano Zampini isused = pressures; 26721f4df5f7SStefano Zampini } else { 26734edc6404Sstefano_zampini isused = zerodiag_save; 26741f4df5f7SStefano Zampini } 2675a198735bSStefano Zampini ierr = MatGetLocalToGlobalMapping(pc->pmat,&l2gmap,NULL);CHKERRQ(ierr); 2676669cc0f4SStefano Zampini ierr = MatISGetLocalMat(pc->pmat,&A);CHKERRQ(ierr); 26771ae86dd6SStefano Zampini ierr = MatGetLocalSize(A,&n,NULL);CHKERRQ(ierr); 26781ae86dd6SStefano Zampini if (!isused && n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_USER,"Don't know how to extract div u dot p! Please provide the pressure field"); 2679a198735bSStefano Zampini n_isused = 0; 2680a198735bSStefano Zampini if (isused) { 2681a198735bSStefano Zampini ierr = ISGetLocalSize(isused,&n_isused);CHKERRQ(ierr); 2682a198735bSStefano Zampini } 2683a198735bSStefano Zampini ierr = MPI_Scan(&n_isused,&st,1,MPIU_INT,MPI_SUM,PetscObjectComm((PetscObject)pc));CHKERRQ(ierr); 2684a198735bSStefano Zampini st = st-n_isused; 26851ae86dd6SStefano Zampini if (n) { 2686a198735bSStefano Zampini const PetscInt *gidxs; 2687a198735bSStefano Zampini 26887dae84e0SHong Zhang ierr = MatCreateSubMatrix(A,isused,NULL,MAT_INITIAL_MATRIX,&loc_divudotp);CHKERRQ(ierr); 2689a198735bSStefano Zampini ierr = ISLocalToGlobalMappingGetIndices(l2gmap,&gidxs);CHKERRQ(ierr); 2690a198735bSStefano Zampini /* TODO: extend ISCreateStride with st = PETSC_DECIDE */ 2691a198735bSStefano Zampini ierr = ISCreateStride(PetscObjectComm((PetscObject)pc),n_isused,st,1,&row);CHKERRQ(ierr); 2692a198735bSStefano Zampini ierr = 
ISCreateGeneral(PetscObjectComm((PetscObject)pc),n,gidxs,PETSC_COPY_VALUES,&col);CHKERRQ(ierr); 2693a198735bSStefano Zampini ierr = ISLocalToGlobalMappingRestoreIndices(l2gmap,&gidxs);CHKERRQ(ierr); 26941ae86dd6SStefano Zampini } else { 2695a198735bSStefano Zampini ierr = MatCreateSeqAIJ(PETSC_COMM_SELF,0,0,1,NULL,&loc_divudotp);CHKERRQ(ierr); 2696a198735bSStefano Zampini ierr = ISCreateStride(PetscObjectComm((PetscObject)pc),n_isused,st,1,&row);CHKERRQ(ierr); 2697a198735bSStefano Zampini ierr = ISCreateGeneral(PetscObjectComm((PetscObject)pc),0,NULL,PETSC_COPY_VALUES,&col);CHKERRQ(ierr); 2698a198735bSStefano Zampini } 2699a198735bSStefano Zampini ierr = MatGetSize(pc->pmat,NULL,&N);CHKERRQ(ierr); 2700a198735bSStefano Zampini ierr = ISGetSize(row,&M);CHKERRQ(ierr); 2701a198735bSStefano Zampini ierr = ISLocalToGlobalMappingCreateIS(row,&rl2g);CHKERRQ(ierr); 2702a198735bSStefano Zampini ierr = ISLocalToGlobalMappingCreateIS(col,&cl2g);CHKERRQ(ierr); 2703a198735bSStefano Zampini ierr = ISDestroy(&row);CHKERRQ(ierr); 2704a198735bSStefano Zampini ierr = ISDestroy(&col);CHKERRQ(ierr); 2705a198735bSStefano Zampini ierr = MatCreate(PetscObjectComm((PetscObject)pc),&pcbddc->divudotp);CHKERRQ(ierr); 2706a198735bSStefano Zampini ierr = MatSetType(pcbddc->divudotp,MATIS);CHKERRQ(ierr); 2707a198735bSStefano Zampini ierr = MatSetSizes(pcbddc->divudotp,PETSC_DECIDE,PETSC_DECIDE,M,N);CHKERRQ(ierr); 2708a198735bSStefano Zampini ierr = MatSetLocalToGlobalMapping(pcbddc->divudotp,rl2g,cl2g);CHKERRQ(ierr); 2709a198735bSStefano Zampini ierr = ISLocalToGlobalMappingDestroy(&rl2g);CHKERRQ(ierr); 2710a198735bSStefano Zampini ierr = ISLocalToGlobalMappingDestroy(&cl2g);CHKERRQ(ierr); 2711a198735bSStefano Zampini ierr = MatISSetLocalMat(pcbddc->divudotp,loc_divudotp);CHKERRQ(ierr); 2712a198735bSStefano Zampini ierr = MatDestroy(&loc_divudotp);CHKERRQ(ierr); 27131ae86dd6SStefano Zampini ierr = MatAssemblyBegin(pcbddc->divudotp,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 27141ae86dd6SStefano Zampini 
ierr = MatAssemblyEnd(pcbddc->divudotp,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 27151ae86dd6SStefano Zampini } 27164edc6404Sstefano_zampini ierr = ISDestroy(&zerodiag_save);CHKERRQ(ierr); 2717b3afcdbeSStefano Zampini 2718b3afcdbeSStefano Zampini /* change of basis and p0 dofs */ 27194f1b2e48SStefano Zampini if (has_null_pressures) { 27204f1b2e48SStefano Zampini IS zerodiagc; 27214f1b2e48SStefano Zampini const PetscInt *idxs,*idxsc; 27224f1b2e48SStefano Zampini PetscInt i,s,*nnz; 27234f1b2e48SStefano Zampini 27244f1b2e48SStefano Zampini ierr = ISGetLocalSize(zerodiag,&nz);CHKERRQ(ierr); 2725339f8db1SStefano Zampini ierr = ISComplement(zerodiag,0,n,&zerodiagc);CHKERRQ(ierr); 2726339f8db1SStefano Zampini ierr = ISGetIndices(zerodiagc,&idxsc);CHKERRQ(ierr); 2727339f8db1SStefano Zampini /* local change of basis for pressures */ 2728339f8db1SStefano Zampini ierr = MatDestroy(&pcbddc->benign_change);CHKERRQ(ierr); 272997d764eeSStefano Zampini ierr = MatCreate(PetscObjectComm((PetscObject)pcbddc->local_mat),&pcbddc->benign_change);CHKERRQ(ierr); 2730339f8db1SStefano Zampini ierr = MatSetType(pcbddc->benign_change,MATAIJ);CHKERRQ(ierr); 2731339f8db1SStefano Zampini ierr = MatSetSizes(pcbddc->benign_change,n,n,PETSC_DECIDE,PETSC_DECIDE);CHKERRQ(ierr); 2732339f8db1SStefano Zampini ierr = PetscMalloc1(n,&nnz);CHKERRQ(ierr); 27334f1b2e48SStefano Zampini for (i=0;i<n-nz;i++) nnz[idxsc[i]] = 1; /* identity on velocities plus pressure dofs for non-singular subdomains */ 27344f1b2e48SStefano Zampini for (i=0;i<pcbddc->benign_n;i++) { 27354f1b2e48SStefano Zampini PetscInt nzs,j; 27364f1b2e48SStefano Zampini 27374f1b2e48SStefano Zampini ierr = ISGetLocalSize(zerodiag_subs[i],&nzs);CHKERRQ(ierr); 27384f1b2e48SStefano Zampini ierr = ISGetIndices(zerodiag_subs[i],&idxs);CHKERRQ(ierr); 27394f1b2e48SStefano Zampini for (j=0;j<nzs-1;j++) nnz[idxs[j]] = 2; /* change on pressures */ 27404f1b2e48SStefano Zampini nnz[idxs[nzs-1]] = nzs; /* last local pressure dof in subdomain */ 27414f1b2e48SStefano 
Zampini ierr = ISRestoreIndices(zerodiag_subs[i],&idxs);CHKERRQ(ierr); 27424f1b2e48SStefano Zampini } 2743339f8db1SStefano Zampini ierr = MatSeqAIJSetPreallocation(pcbddc->benign_change,0,nnz);CHKERRQ(ierr); 2744339f8db1SStefano Zampini ierr = PetscFree(nnz);CHKERRQ(ierr); 2745339f8db1SStefano Zampini /* set identity on velocities */ 2746339f8db1SStefano Zampini for (i=0;i<n-nz;i++) { 2747339f8db1SStefano Zampini ierr = MatSetValue(pcbddc->benign_change,idxsc[i],idxsc[i],1.,INSERT_VALUES);CHKERRQ(ierr); 2748339f8db1SStefano Zampini } 27494f1b2e48SStefano Zampini ierr = ISRestoreIndices(zerodiagc,&idxsc);CHKERRQ(ierr); 27504f1b2e48SStefano Zampini ierr = ISDestroy(&zerodiagc);CHKERRQ(ierr); 27519f47a83aSStefano Zampini ierr = PetscFree3(pcbddc->benign_p0_lidx,pcbddc->benign_p0_gidx,pcbddc->benign_p0);CHKERRQ(ierr); 27524f1b2e48SStefano Zampini ierr = PetscMalloc3(pcbddc->benign_n,&pcbddc->benign_p0_lidx,pcbddc->benign_n,&pcbddc->benign_p0_gidx,pcbddc->benign_n,&pcbddc->benign_p0);CHKERRQ(ierr); 2753339f8db1SStefano Zampini /* set change on pressures */ 27544f1b2e48SStefano Zampini for (s=0;s<pcbddc->benign_n;s++) { 27554f1b2e48SStefano Zampini PetscScalar *array; 27564f1b2e48SStefano Zampini PetscInt nzs; 27574f1b2e48SStefano Zampini 27584f1b2e48SStefano Zampini ierr = ISGetLocalSize(zerodiag_subs[s],&nzs);CHKERRQ(ierr); 27594f1b2e48SStefano Zampini ierr = ISGetIndices(zerodiag_subs[s],&idxs);CHKERRQ(ierr); 27604f1b2e48SStefano Zampini for (i=0;i<nzs-1;i++) { 2761339f8db1SStefano Zampini PetscScalar vals[2]; 2762339f8db1SStefano Zampini PetscInt cols[2]; 2763339f8db1SStefano Zampini 2764339f8db1SStefano Zampini cols[0] = idxs[i]; 27654f1b2e48SStefano Zampini cols[1] = idxs[nzs-1]; 2766339f8db1SStefano Zampini vals[0] = 1.; 2767b0f5fe93SStefano Zampini vals[1] = 1.; 27684f1b2e48SStefano Zampini ierr = MatSetValues(pcbddc->benign_change,1,cols,2,cols,vals,INSERT_VALUES);CHKERRQ(ierr); 2769339f8db1SStefano Zampini } 27704f1b2e48SStefano Zampini ierr = 
PetscMalloc1(nzs,&array);CHKERRQ(ierr); 27714f1b2e48SStefano Zampini for (i=0;i<nzs-1;i++) array[i] = -1.; 27724f1b2e48SStefano Zampini array[nzs-1] = 1.; 27734f1b2e48SStefano Zampini ierr = MatSetValues(pcbddc->benign_change,1,idxs+nzs-1,nzs,idxs,array,INSERT_VALUES);CHKERRQ(ierr); 27744f1b2e48SStefano Zampini /* store local idxs for p0 */ 27754f1b2e48SStefano Zampini pcbddc->benign_p0_lidx[s] = idxs[nzs-1]; 27764f1b2e48SStefano Zampini ierr = ISRestoreIndices(zerodiag_subs[s],&idxs);CHKERRQ(ierr); 2777339f8db1SStefano Zampini ierr = PetscFree(array);CHKERRQ(ierr); 27784f1b2e48SStefano Zampini } 2779339f8db1SStefano Zampini ierr = MatAssemblyBegin(pcbddc->benign_change,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2780339f8db1SStefano Zampini ierr = MatAssemblyEnd(pcbddc->benign_change,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2781a3df083aSStefano Zampini /* project if needed */ 2782a3df083aSStefano Zampini if (pcbddc->benign_change_explicit) { 27831dd7afcfSStefano Zampini Mat M; 27841dd7afcfSStefano Zampini 27851dd7afcfSStefano Zampini ierr = MatPtAP(pcbddc->local_mat,pcbddc->benign_change,MAT_INITIAL_MATRIX,2.0,&M);CHKERRQ(ierr); 2786339f8db1SStefano Zampini ierr = MatDestroy(&pcbddc->local_mat);CHKERRQ(ierr); 27871dd7afcfSStefano Zampini ierr = MatSeqAIJCompress(M,&pcbddc->local_mat);CHKERRQ(ierr); 27881dd7afcfSStefano Zampini ierr = MatDestroy(&M);CHKERRQ(ierr); 2789a3df083aSStefano Zampini } 27904f1b2e48SStefano Zampini /* store global idxs for p0 */ 27914f1b2e48SStefano Zampini ierr = ISLocalToGlobalMappingApply(pc->pmat->rmap->mapping,pcbddc->benign_n,pcbddc->benign_p0_lidx,pcbddc->benign_p0_gidx);CHKERRQ(ierr); 2792339f8db1SStefano Zampini } 2793ca92afb2SStefano Zampini pcbddc->benign_zerodiag_subs = zerodiag_subs; 27944f1b2e48SStefano Zampini ierr = ISDestroy(&pressures);CHKERRQ(ierr); 2795b0f5fe93SStefano Zampini 2796b0f5fe93SStefano Zampini /* determines if the coarse solver will be singular or not */ 2797b0f5fe93SStefano Zampini ierr = 
MPI_Allreduce(&have_null,&pcbddc->benign_null,1,MPIU_BOOL,MPI_LAND,PetscObjectComm((PetscObject)pc));CHKERRQ(ierr); 279827b6a85dSStefano Zampini /* determines if the problem has subdomains with 0 pressure block */ 279927b6a85dSStefano Zampini ierr = MPI_Allreduce(&have_null,&pcbddc->benign_have_null,1,MPIU_BOOL,MPI_LOR,PetscObjectComm((PetscObject)pc));CHKERRQ(ierr); 2800339f8db1SStefano Zampini *zerodiaglocal = zerodiag; 2801339f8db1SStefano Zampini PetscFunctionReturn(0); 2802339f8db1SStefano Zampini } 2803339f8db1SStefano Zampini 2804015636ebSStefano Zampini PetscErrorCode PCBDDCBenignGetOrSetP0(PC pc, Vec v, PetscBool get) 2805efc2fbd9SStefano Zampini { 2806efc2fbd9SStefano Zampini PC_BDDC* pcbddc = (PC_BDDC*)pc->data; 2807de9d7bd0SStefano Zampini PetscScalar *array; 2808efc2fbd9SStefano Zampini PetscErrorCode ierr; 2809efc2fbd9SStefano Zampini 2810efc2fbd9SStefano Zampini PetscFunctionBegin; 2811efc2fbd9SStefano Zampini if (!pcbddc->benign_sf) { 2812efc2fbd9SStefano Zampini ierr = PetscSFCreate(PetscObjectComm((PetscObject)pc),&pcbddc->benign_sf);CHKERRQ(ierr); 28134f1b2e48SStefano Zampini ierr = PetscSFSetGraphLayout(pcbddc->benign_sf,pc->pmat->rmap,pcbddc->benign_n,NULL,PETSC_OWN_POINTER,pcbddc->benign_p0_gidx);CHKERRQ(ierr); 2814efc2fbd9SStefano Zampini } 2815de9d7bd0SStefano Zampini if (get) { 2816efc2fbd9SStefano Zampini ierr = VecGetArrayRead(v,(const PetscScalar**)&array);CHKERRQ(ierr); 28174f1b2e48SStefano Zampini ierr = PetscSFBcastBegin(pcbddc->benign_sf,MPIU_SCALAR,array,pcbddc->benign_p0);CHKERRQ(ierr); 28184f1b2e48SStefano Zampini ierr = PetscSFBcastEnd(pcbddc->benign_sf,MPIU_SCALAR,array,pcbddc->benign_p0);CHKERRQ(ierr); 2819efc2fbd9SStefano Zampini ierr = VecRestoreArrayRead(v,(const PetscScalar**)&array);CHKERRQ(ierr); 2820de9d7bd0SStefano Zampini } else { 2821de9d7bd0SStefano Zampini ierr = VecGetArray(v,&array);CHKERRQ(ierr); 2822de9d7bd0SStefano Zampini ierr = 
PetscSFReduceBegin(pcbddc->benign_sf,MPIU_SCALAR,pcbddc->benign_p0,array,MPIU_REPLACE);CHKERRQ(ierr); 2823de9d7bd0SStefano Zampini ierr = PetscSFReduceEnd(pcbddc->benign_sf,MPIU_SCALAR,pcbddc->benign_p0,array,MPIU_REPLACE);CHKERRQ(ierr); 2824de9d7bd0SStefano Zampini ierr = VecRestoreArray(v,&array);CHKERRQ(ierr); 2825efc2fbd9SStefano Zampini } 2826efc2fbd9SStefano Zampini PetscFunctionReturn(0); 2827efc2fbd9SStefano Zampini } 2828efc2fbd9SStefano Zampini 2829c263805aSStefano Zampini PetscErrorCode PCBDDCBenignPopOrPushB0(PC pc, PetscBool pop) 2830c263805aSStefano Zampini { 2831c263805aSStefano Zampini PC_BDDC* pcbddc = (PC_BDDC*)pc->data; 2832c263805aSStefano Zampini PetscErrorCode ierr; 2833c263805aSStefano Zampini 2834c263805aSStefano Zampini PetscFunctionBegin; 2835c263805aSStefano Zampini /* TODO: add error checking 2836c263805aSStefano Zampini - avoid nested pop (or push) calls. 2837c263805aSStefano Zampini - cannot push before pop. 28381c604dc7SStefano Zampini - cannot call this if pcbddc->local_mat is NULL 2839c263805aSStefano Zampini */ 28404f1b2e48SStefano Zampini if (!pcbddc->benign_n) { 2841efc2fbd9SStefano Zampini PetscFunctionReturn(0); 2842efc2fbd9SStefano Zampini } 2843c263805aSStefano Zampini if (pop) { 2844a3df083aSStefano Zampini if (pcbddc->benign_change_explicit) { 28454f1b2e48SStefano Zampini IS is_p0; 28464f1b2e48SStefano Zampini MatReuse reuse; 2847c263805aSStefano Zampini 2848c263805aSStefano Zampini /* extract B_0 */ 28494f1b2e48SStefano Zampini reuse = MAT_INITIAL_MATRIX; 28504f1b2e48SStefano Zampini if (pcbddc->benign_B0) { 28514f1b2e48SStefano Zampini reuse = MAT_REUSE_MATRIX; 28524f1b2e48SStefano Zampini } 28534f1b2e48SStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,pcbddc->benign_n,pcbddc->benign_p0_lidx,PETSC_COPY_VALUES,&is_p0);CHKERRQ(ierr); 28547dae84e0SHong Zhang ierr = MatCreateSubMatrix(pcbddc->local_mat,is_p0,NULL,reuse,&pcbddc->benign_B0);CHKERRQ(ierr); 2855c263805aSStefano Zampini /* remove rows and cols from local 
problem */ 2856c263805aSStefano Zampini ierr = MatSetOption(pcbddc->local_mat,MAT_KEEP_NONZERO_PATTERN,PETSC_TRUE);CHKERRQ(ierr); 285797d764eeSStefano Zampini ierr = MatSetOption(pcbddc->local_mat,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_FALSE);CHKERRQ(ierr); 28584f1b2e48SStefano Zampini ierr = MatZeroRowsColumnsIS(pcbddc->local_mat,is_p0,1.0,NULL,NULL);CHKERRQ(ierr); 28594f1b2e48SStefano Zampini ierr = ISDestroy(&is_p0);CHKERRQ(ierr); 2860a3df083aSStefano Zampini } else { 2861a3df083aSStefano Zampini Mat_IS *matis = (Mat_IS*)pc->pmat->data; 2862a3df083aSStefano Zampini PetscScalar *vals; 2863a3df083aSStefano Zampini PetscInt i,n,*idxs_ins; 2864a3df083aSStefano Zampini 2865a3df083aSStefano Zampini ierr = VecGetLocalSize(matis->y,&n);CHKERRQ(ierr); 2866a3df083aSStefano Zampini ierr = PetscMalloc2(n,&idxs_ins,n,&vals);CHKERRQ(ierr); 2867a3df083aSStefano Zampini if (!pcbddc->benign_B0) { 28680b5adadeSStefano Zampini PetscInt *nnz; 2869a3df083aSStefano Zampini ierr = MatCreate(PetscObjectComm((PetscObject)pcbddc->local_mat),&pcbddc->benign_B0);CHKERRQ(ierr); 2870a3df083aSStefano Zampini ierr = MatSetType(pcbddc->benign_B0,MATAIJ);CHKERRQ(ierr); 2871a3df083aSStefano Zampini ierr = MatSetSizes(pcbddc->benign_B0,pcbddc->benign_n,n,PETSC_DECIDE,PETSC_DECIDE);CHKERRQ(ierr); 2872331e053bSStefano Zampini ierr = PetscMalloc1(pcbddc->benign_n,&nnz);CHKERRQ(ierr); 2873331e053bSStefano Zampini for (i=0;i<pcbddc->benign_n;i++) { 2874331e053bSStefano Zampini ierr = ISGetLocalSize(pcbddc->benign_zerodiag_subs[i],&nnz[i]);CHKERRQ(ierr); 2875331e053bSStefano Zampini nnz[i] = n - nnz[i]; 2876331e053bSStefano Zampini } 2877331e053bSStefano Zampini ierr = MatSeqAIJSetPreallocation(pcbddc->benign_B0,0,nnz);CHKERRQ(ierr); 2878331e053bSStefano Zampini ierr = PetscFree(nnz);CHKERRQ(ierr); 2879331e053bSStefano Zampini } 2880a3df083aSStefano Zampini 2881a3df083aSStefano Zampini for (i=0;i<pcbddc->benign_n;i++) { 2882a3df083aSStefano Zampini PetscScalar *array; 2883a3df083aSStefano Zampini PetscInt 
*idxs,j,nz,cum; 2884a3df083aSStefano Zampini 2885a3df083aSStefano Zampini ierr = VecSet(matis->x,0.);CHKERRQ(ierr); 2886a3df083aSStefano Zampini ierr = ISGetLocalSize(pcbddc->benign_zerodiag_subs[i],&nz);CHKERRQ(ierr); 2887a3df083aSStefano Zampini ierr = ISGetIndices(pcbddc->benign_zerodiag_subs[i],(const PetscInt**)&idxs);CHKERRQ(ierr); 2888a3df083aSStefano Zampini for (j=0;j<nz;j++) vals[j] = 1.; 2889a3df083aSStefano Zampini ierr = VecSetValues(matis->x,nz,idxs,vals,INSERT_VALUES);CHKERRQ(ierr); 2890a3df083aSStefano Zampini ierr = VecAssemblyBegin(matis->x);CHKERRQ(ierr); 2891a3df083aSStefano Zampini ierr = VecAssemblyEnd(matis->x);CHKERRQ(ierr); 2892a3df083aSStefano Zampini ierr = VecSet(matis->y,0.);CHKERRQ(ierr); 2893a3df083aSStefano Zampini ierr = MatMult(matis->A,matis->x,matis->y);CHKERRQ(ierr); 2894a3df083aSStefano Zampini ierr = VecGetArray(matis->y,&array);CHKERRQ(ierr); 2895a3df083aSStefano Zampini cum = 0; 2896a3df083aSStefano Zampini for (j=0;j<n;j++) { 289722db5ddcSStefano Zampini if (PetscUnlikely(PetscAbsScalar(array[j]) > PETSC_SMALL)) { 2898a3df083aSStefano Zampini vals[cum] = array[j]; 2899a3df083aSStefano Zampini idxs_ins[cum] = j; 2900a3df083aSStefano Zampini cum++; 2901a3df083aSStefano Zampini } 2902a3df083aSStefano Zampini } 2903a3df083aSStefano Zampini ierr = MatSetValues(pcbddc->benign_B0,1,&i,cum,idxs_ins,vals,INSERT_VALUES);CHKERRQ(ierr); 2904a3df083aSStefano Zampini ierr = VecRestoreArray(matis->y,&array);CHKERRQ(ierr); 2905a3df083aSStefano Zampini ierr = ISRestoreIndices(pcbddc->benign_zerodiag_subs[i],(const PetscInt**)&idxs);CHKERRQ(ierr); 2906a3df083aSStefano Zampini } 2907a3df083aSStefano Zampini ierr = MatAssemblyBegin(pcbddc->benign_B0,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2908a3df083aSStefano Zampini ierr = MatAssemblyEnd(pcbddc->benign_B0,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2909a3df083aSStefano Zampini ierr = PetscFree2(idxs_ins,vals);CHKERRQ(ierr); 2910a3df083aSStefano Zampini } 2911c263805aSStefano Zampini } else { /* push */ 
2912a3df083aSStefano Zampini if (pcbddc->benign_change_explicit) { 29134f1b2e48SStefano Zampini PetscInt i; 29144f1b2e48SStefano Zampini 29154f1b2e48SStefano Zampini for (i=0;i<pcbddc->benign_n;i++) { 29164f1b2e48SStefano Zampini PetscScalar *B0_vals; 29174f1b2e48SStefano Zampini PetscInt *B0_cols,B0_ncol; 29184f1b2e48SStefano Zampini 29194f1b2e48SStefano Zampini ierr = MatGetRow(pcbddc->benign_B0,i,&B0_ncol,(const PetscInt**)&B0_cols,(const PetscScalar**)&B0_vals);CHKERRQ(ierr); 29204f1b2e48SStefano Zampini ierr = MatSetValues(pcbddc->local_mat,1,pcbddc->benign_p0_lidx+i,B0_ncol,B0_cols,B0_vals,INSERT_VALUES);CHKERRQ(ierr); 29217b034428SStefano Zampini ierr = MatSetValues(pcbddc->local_mat,B0_ncol,B0_cols,1,pcbddc->benign_p0_lidx+i,B0_vals,INSERT_VALUES);CHKERRQ(ierr); 29224f1b2e48SStefano Zampini ierr = MatSetValue(pcbddc->local_mat,pcbddc->benign_p0_lidx[i],pcbddc->benign_p0_lidx[i],0.0,INSERT_VALUES);CHKERRQ(ierr); 29234f1b2e48SStefano Zampini ierr = MatRestoreRow(pcbddc->benign_B0,i,&B0_ncol,(const PetscInt**)&B0_cols,(const PetscScalar**)&B0_vals);CHKERRQ(ierr); 29244f1b2e48SStefano Zampini } 2925c263805aSStefano Zampini ierr = MatAssemblyBegin(pcbddc->local_mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2926c263805aSStefano Zampini ierr = MatAssemblyEnd(pcbddc->local_mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2927a3df083aSStefano Zampini } else { 2928a3df083aSStefano Zampini SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Cannot push B0!\n"); 2929a3df083aSStefano Zampini } 2930c263805aSStefano Zampini } 2931c263805aSStefano Zampini PetscFunctionReturn(0); 2932c263805aSStefano Zampini } 2933c263805aSStefano Zampini 293408122e43SStefano Zampini PetscErrorCode PCBDDCAdaptiveSelection(PC pc) 2935b1b3d7a2SStefano Zampini { 2936b1b3d7a2SStefano Zampini PC_BDDC* pcbddc = (PC_BDDC*)pc->data; 293708122e43SStefano Zampini PCBDDCSubSchurs sub_schurs = pcbddc->sub_schurs; 293808122e43SStefano Zampini PetscBLASInt B_dummyint,B_neigs,B_ierr,B_lwork; 293908122e43SStefano Zampini PetscBLASInt 
*B_iwork,*B_ifail; 294008122e43SStefano Zampini PetscScalar *work,lwork; 294108122e43SStefano Zampini PetscScalar *St,*S,*eigv; 294208122e43SStefano Zampini PetscScalar *Sarray,*Starray; 294308122e43SStefano Zampini PetscReal *eigs,thresh; 29441b968477SStefano Zampini PetscInt i,nmax,nmin,nv,cum,mss,cum2,cumarray,maxneigs; 2945f6f667cfSStefano Zampini PetscBool allocated_S_St; 294608122e43SStefano Zampini #if defined(PETSC_USE_COMPLEX) 294708122e43SStefano Zampini PetscReal *rwork; 294808122e43SStefano Zampini #endif 2949b1b3d7a2SStefano Zampini PetscErrorCode ierr; 2950b1b3d7a2SStefano Zampini 2951b1b3d7a2SStefano Zampini PetscFunctionBegin; 2952b334f244SStefano Zampini if (!sub_schurs) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Adaptive selection of constraints requires SubSchurs data"); 2953af25d912SStefano Zampini if (!sub_schurs->schur_explicit) SETERRQ(PetscObjectComm((PetscObject)pc),PETSC_ERR_SUP,"Adaptive selection of constraints requires MUMPS and/or MKL_CPARDISO"); 2954d750e150Sstefano_zampini if (sub_schurs->n_subs && (!sub_schurs->is_hermitian || !sub_schurs->is_posdef)) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_SUP,"Adaptive selection not yet implemented for general matrix pencils (herm %d, posdef %d)\nRerun with -sub_schurs_hermitian 1 -sub_schurs_posdef 1 if the problem is SPD",sub_schurs->is_hermitian,sub_schurs->is_posdef); 295506a4e24aSStefano Zampini 2956fd14bc51SStefano Zampini if (pcbddc->dbg_flag) { 2957fd14bc51SStefano Zampini ierr = PetscViewerFlush(pcbddc->dbg_viewer);CHKERRQ(ierr); 2958fd14bc51SStefano Zampini ierr = PetscViewerASCIIPrintf(pcbddc->dbg_viewer,"--------------------------------------------------\n");CHKERRQ(ierr); 2959fd14bc51SStefano Zampini ierr = PetscViewerASCIIPrintf(pcbddc->dbg_viewer,"Check adaptive selection of constraints\n");CHKERRQ(ierr); 29601575c14dSBarry Smith ierr = PetscViewerASCIIPushSynchronized(pcbddc->dbg_viewer);CHKERRQ(ierr); 2961fd14bc51SStefano Zampini } 2962fd14bc51SStefano Zampini 2963e496cd5dSStefano Zampini 
if (pcbddc->dbg_flag) { 2964e496cd5dSStefano Zampini PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"Subdomain %04d cc %d (%d,%d).\n",PetscGlobalRank,sub_schurs->n_subs,sub_schurs->is_hermitian,sub_schurs->is_posdef); 2965e496cd5dSStefano Zampini } 2966e496cd5dSStefano Zampini 296708122e43SStefano Zampini /* max size of subsets */ 296808122e43SStefano Zampini mss = 0; 296908122e43SStefano Zampini for (i=0;i<sub_schurs->n_subs;i++) { 297008122e43SStefano Zampini PetscInt subset_size; 2971862806e4SStefano Zampini 297208122e43SStefano Zampini ierr = ISGetLocalSize(sub_schurs->is_subs[i],&subset_size);CHKERRQ(ierr); 297308122e43SStefano Zampini mss = PetscMax(mss,subset_size); 297408122e43SStefano Zampini } 297508122e43SStefano Zampini 297608122e43SStefano Zampini /* min/max and threshold */ 297708122e43SStefano Zampini nmax = pcbddc->adaptive_nmax > 0 ? pcbddc->adaptive_nmax : mss; 2978f6f667cfSStefano Zampini nmin = pcbddc->adaptive_nmin > 0 ? pcbddc->adaptive_nmin : 0; 297908122e43SStefano Zampini nmax = PetscMax(nmin,nmax); 2980f6f667cfSStefano Zampini allocated_S_St = PETSC_FALSE; 2981f6f667cfSStefano Zampini if (nmin) { 2982f6f667cfSStefano Zampini allocated_S_St = PETSC_TRUE; 2983f6f667cfSStefano Zampini } 298408122e43SStefano Zampini 298508122e43SStefano Zampini /* allocate lapack workspace */ 298608122e43SStefano Zampini cum = cum2 = 0; 298708122e43SStefano Zampini maxneigs = 0; 298808122e43SStefano Zampini for (i=0;i<sub_schurs->n_subs;i++) { 298908122e43SStefano Zampini PetscInt n,subset_size; 2990f6f667cfSStefano Zampini 299108122e43SStefano Zampini ierr = ISGetLocalSize(sub_schurs->is_subs[i],&subset_size);CHKERRQ(ierr); 299208122e43SStefano Zampini n = PetscMin(subset_size,nmax); 29939162d606SStefano Zampini cum += subset_size; 29949162d606SStefano Zampini cum2 += subset_size*n; 299508122e43SStefano Zampini maxneigs = PetscMax(maxneigs,n); 299608122e43SStefano Zampini } 299708122e43SStefano Zampini if (mss) { 29989ab7bb16SStefano Zampini if 
(sub_schurs->is_hermitian && sub_schurs->is_posdef) { 299908122e43SStefano Zampini PetscBLASInt B_itype = 1; 300008122e43SStefano Zampini PetscBLASInt B_N = mss; 30014c6709b3SStefano Zampini PetscReal zero = 0.0; 30024c6709b3SStefano Zampini PetscReal eps = 0.0; /* dlamch? */ 300308122e43SStefano Zampini 300408122e43SStefano Zampini B_lwork = -1; 300508122e43SStefano Zampini S = NULL; 300608122e43SStefano Zampini St = NULL; 3007a58a30b4SStefano Zampini eigs = NULL; 3008a58a30b4SStefano Zampini eigv = NULL; 3009a58a30b4SStefano Zampini B_iwork = NULL; 3010a58a30b4SStefano Zampini B_ifail = NULL; 3011d1710679SStefano Zampini #if defined(PETSC_USE_COMPLEX) 3012d1710679SStefano Zampini rwork = NULL; 3013d1710679SStefano Zampini #endif 30148bec7fa6SStefano Zampini thresh = 1.0; 301508122e43SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 301608122e43SStefano Zampini #if defined(PETSC_USE_COMPLEX) 301708122e43SStefano Zampini PetscStackCallBLAS("LAPACKsygvx",LAPACKsygvx_(&B_itype,"V","V","L",&B_N,St,&B_N,S,&B_N,&zero,&thresh,&B_dummyint,&B_dummyint,&eps,&B_neigs,eigs,eigv,&B_N,&lwork,&B_lwork,rwork,B_iwork,B_ifail,&B_ierr)); 301808122e43SStefano Zampini #else 301908122e43SStefano Zampini PetscStackCallBLAS("LAPACKsygvx",LAPACKsygvx_(&B_itype,"V","V","L",&B_N,St,&B_N,S,&B_N,&zero,&thresh,&B_dummyint,&B_dummyint,&eps,&B_neigs,eigs,eigv,&B_N,&lwork,&B_lwork,B_iwork,B_ifail,&B_ierr)); 302008122e43SStefano Zampini #endif 302108122e43SStefano Zampini if (B_ierr != 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in query to SYGVX Lapack routine %d",(int)B_ierr); 302208122e43SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 302308122e43SStefano Zampini } else { 302408122e43SStefano Zampini /* TODO */ 302508122e43SStefano Zampini } 302608122e43SStefano Zampini } else { 302708122e43SStefano Zampini lwork = 0; 302808122e43SStefano Zampini } 302908122e43SStefano Zampini 303008122e43SStefano Zampini nv = 0; 3031d62866d3SStefano Zampini if 
(sub_schurs->is_vertices && pcbddc->use_vertices) { /* complement set of active subsets, each entry is a vertex (boundary made by active subsets, vertices and dirichlet dofs) */ 3032d62866d3SStefano Zampini ierr = ISGetLocalSize(sub_schurs->is_vertices,&nv);CHKERRQ(ierr); 303308122e43SStefano Zampini } 30344c6709b3SStefano Zampini ierr = PetscBLASIntCast((PetscInt)PetscRealPart(lwork),&B_lwork);CHKERRQ(ierr); 3035f6f667cfSStefano Zampini if (allocated_S_St) { 3036f6f667cfSStefano Zampini ierr = PetscMalloc2(mss*mss,&S,mss*mss,&St);CHKERRQ(ierr); 3037f6f667cfSStefano Zampini } 3038f6f667cfSStefano Zampini ierr = PetscMalloc5(mss*mss,&eigv,mss,&eigs,B_lwork,&work,5*mss,&B_iwork,mss,&B_ifail);CHKERRQ(ierr); 303908122e43SStefano Zampini #if defined(PETSC_USE_COMPLEX) 304008122e43SStefano Zampini ierr = PetscMalloc1(7*mss,&rwork);CHKERRQ(ierr); 304108122e43SStefano Zampini #endif 30429162d606SStefano Zampini ierr = PetscMalloc5(nv+sub_schurs->n_subs,&pcbddc->adaptive_constraints_n, 30439162d606SStefano Zampini nv+sub_schurs->n_subs+1,&pcbddc->adaptive_constraints_idxs_ptr, 30449162d606SStefano Zampini nv+sub_schurs->n_subs+1,&pcbddc->adaptive_constraints_data_ptr, 304508122e43SStefano Zampini nv+cum,&pcbddc->adaptive_constraints_idxs, 30469162d606SStefano Zampini nv+cum2,&pcbddc->adaptive_constraints_data);CHKERRQ(ierr); 304708122e43SStefano Zampini ierr = PetscMemzero(pcbddc->adaptive_constraints_n,(nv+sub_schurs->n_subs)*sizeof(PetscInt));CHKERRQ(ierr); 304808122e43SStefano Zampini 304908122e43SStefano Zampini maxneigs = 0; 305072b8c272SStefano Zampini cum = cumarray = 0; 30519162d606SStefano Zampini pcbddc->adaptive_constraints_idxs_ptr[0] = 0; 30529162d606SStefano Zampini pcbddc->adaptive_constraints_data_ptr[0] = 0; 3053d62866d3SStefano Zampini if (sub_schurs->is_vertices && pcbddc->use_vertices) { 305408122e43SStefano Zampini const PetscInt *idxs; 305508122e43SStefano Zampini 3056d62866d3SStefano Zampini ierr = 
ISGetIndices(sub_schurs->is_vertices,&idxs);CHKERRQ(ierr); 305708122e43SStefano Zampini for (cum=0;cum<nv;cum++) { 305808122e43SStefano Zampini pcbddc->adaptive_constraints_n[cum] = 1; 305908122e43SStefano Zampini pcbddc->adaptive_constraints_idxs[cum] = idxs[cum]; 306008122e43SStefano Zampini pcbddc->adaptive_constraints_data[cum] = 1.0; 30619162d606SStefano Zampini pcbddc->adaptive_constraints_idxs_ptr[cum+1] = pcbddc->adaptive_constraints_idxs_ptr[cum]+1; 30629162d606SStefano Zampini pcbddc->adaptive_constraints_data_ptr[cum+1] = pcbddc->adaptive_constraints_data_ptr[cum]+1; 306308122e43SStefano Zampini } 3064d62866d3SStefano Zampini ierr = ISRestoreIndices(sub_schurs->is_vertices,&idxs);CHKERRQ(ierr); 306508122e43SStefano Zampini } 306608122e43SStefano Zampini 306708122e43SStefano Zampini if (mss) { /* multilevel */ 306808122e43SStefano Zampini ierr = MatSeqAIJGetArray(sub_schurs->sum_S_Ej_inv_all,&Sarray);CHKERRQ(ierr); 306908122e43SStefano Zampini ierr = MatSeqAIJGetArray(sub_schurs->sum_S_Ej_tilda_all,&Starray);CHKERRQ(ierr); 307008122e43SStefano Zampini } 307108122e43SStefano Zampini 3072ffd830a3SStefano Zampini thresh = pcbddc->adaptive_threshold; 307308122e43SStefano Zampini for (i=0;i<sub_schurs->n_subs;i++) { 307408122e43SStefano Zampini const PetscInt *idxs; 30759d54b7f4SStefano Zampini PetscReal upper,lower; 3076862806e4SStefano Zampini PetscInt j,subset_size,eigs_start = 0; 307708122e43SStefano Zampini PetscBLASInt B_N; 3078aff50787SStefano Zampini PetscBool same_data = PETSC_FALSE; 307908122e43SStefano Zampini 30809d54b7f4SStefano Zampini if (pcbddc->use_deluxe_scaling) { 30819d54b7f4SStefano Zampini upper = PETSC_MAX_REAL; 30829d54b7f4SStefano Zampini lower = thresh; 30839d54b7f4SStefano Zampini } else { 30849d54b7f4SStefano Zampini upper = 1./thresh; 30859d54b7f4SStefano Zampini lower = 0.; 30869d54b7f4SStefano Zampini } 3087862806e4SStefano Zampini ierr = ISGetLocalSize(sub_schurs->is_subs[i],&subset_size);CHKERRQ(ierr); 3088ffd830a3SStefano 
Zampini ierr = ISGetIndices(sub_schurs->is_subs[i],&idxs);CHKERRQ(ierr); 3089f6f667cfSStefano Zampini ierr = PetscBLASIntCast(subset_size,&B_N);CHKERRQ(ierr); 3090f6f667cfSStefano Zampini if (allocated_S_St) { /* S and S_t should be copied since we could need them later */ 30919ab7bb16SStefano Zampini if (sub_schurs->is_hermitian) { 3092aff50787SStefano Zampini PetscInt j,k; 3093aff50787SStefano Zampini if (sub_schurs->n_subs == 1) { /* zeroing memory to use PetscMemcmp later */ 3094aff50787SStefano Zampini ierr = PetscMemzero(S,subset_size*subset_size*sizeof(PetscScalar));CHKERRQ(ierr); 3095aff50787SStefano Zampini ierr = PetscMemzero(St,subset_size*subset_size*sizeof(PetscScalar));CHKERRQ(ierr); 309608122e43SStefano Zampini } 309708122e43SStefano Zampini for (j=0;j<subset_size;j++) { 3098aff50787SStefano Zampini for (k=j;k<subset_size;k++) { 3099aff50787SStefano Zampini S [j*subset_size+k] = Sarray [cumarray+j*subset_size+k]; 3100aff50787SStefano Zampini St[j*subset_size+k] = Starray[cumarray+j*subset_size+k]; 3101aff50787SStefano Zampini } 310208122e43SStefano Zampini } 310308122e43SStefano Zampini } else { 310408122e43SStefano Zampini ierr = PetscMemcpy(S,Sarray+cumarray,subset_size*subset_size*sizeof(PetscScalar));CHKERRQ(ierr); 310508122e43SStefano Zampini ierr = PetscMemcpy(St,Starray+cumarray,subset_size*subset_size*sizeof(PetscScalar));CHKERRQ(ierr); 310608122e43SStefano Zampini } 31078bec7fa6SStefano Zampini } else { 3108f6f667cfSStefano Zampini S = Sarray + cumarray; 3109f6f667cfSStefano Zampini St = Starray + cumarray; 31108bec7fa6SStefano Zampini } 3111aff50787SStefano Zampini /* see if we can save some work */ 3112b7ab4a40SStefano Zampini if (sub_schurs->n_subs == 1 && pcbddc->use_deluxe_scaling) { 3113aff50787SStefano Zampini ierr = PetscMemcmp(S,St,subset_size*subset_size*sizeof(PetscScalar),&same_data);CHKERRQ(ierr); 3114aff50787SStefano Zampini } 3115aff50787SStefano Zampini 3116b7ab4a40SStefano Zampini if (same_data && !sub_schurs->change) { /* 
there's no need of constraints here */ 3117aff50787SStefano Zampini B_neigs = 0; 3118aff50787SStefano Zampini } else { 31199ab7bb16SStefano Zampini if (sub_schurs->is_hermitian && sub_schurs->is_posdef) { 312008122e43SStefano Zampini PetscBLASInt B_itype = 1; 3121f6f667cfSStefano Zampini PetscBLASInt B_IL, B_IU; 31224c6709b3SStefano Zampini PetscReal eps = -1.0; /* dlamch? */ 31239552c7c7SStefano Zampini PetscInt nmin_s; 3124b7ab4a40SStefano Zampini PetscBool compute_range = PETSC_FALSE; 312508122e43SStefano Zampini 3126fd14bc51SStefano Zampini if (pcbddc->dbg_flag) { 3127eee23b56SStefano Zampini PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"Computing for sub %d/%d size %d count %d fid %d.\n",i,sub_schurs->n_subs,subset_size,pcbddc->mat_graph->count[idxs[0]]+1,pcbddc->mat_graph->which_dof[idxs[0]]); 3128fd14bc51SStefano Zampini } 3129d16cbb6bSStefano Zampini 3130b7ab4a40SStefano Zampini compute_range = PETSC_FALSE; 3131b7ab4a40SStefano Zampini if (thresh > 1.+PETSC_SMALL && !same_data) { 3132b7ab4a40SStefano Zampini compute_range = PETSC_TRUE; 3133b7ab4a40SStefano Zampini } 3134b7ab4a40SStefano Zampini 313508122e43SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 3136b7ab4a40SStefano Zampini if (compute_range) { 3137d16cbb6bSStefano Zampini 3138d16cbb6bSStefano Zampini /* ask for eigenvalues larger than thresh */ 313908122e43SStefano Zampini #if defined(PETSC_USE_COMPLEX) 31409d54b7f4SStefano Zampini PetscStackCallBLAS("LAPACKsygvx",LAPACKsygvx_(&B_itype,"V","V","L",&B_N,St,&B_N,S,&B_N,&lower,&upper,&B_IL,&B_IU,&eps,&B_neigs,eigs,eigv,&B_N,work,&B_lwork,rwork,B_iwork,B_ifail,&B_ierr)); 314108122e43SStefano Zampini #else 31429d54b7f4SStefano Zampini PetscStackCallBLAS("LAPACKsygvx",LAPACKsygvx_(&B_itype,"V","V","L",&B_N,St,&B_N,S,&B_N,&lower,&upper,&B_IL,&B_IU,&eps,&B_neigs,eigs,eigv,&B_N,work,&B_lwork,B_iwork,B_ifail,&B_ierr)); 314308122e43SStefano Zampini #endif 3144b7ab4a40SStefano Zampini } else if (!same_data) { 
3145d16cbb6bSStefano Zampini B_IU = PetscMax(1,PetscMin(B_N,nmax)); 3146d16cbb6bSStefano Zampini B_IL = 1; 3147d16cbb6bSStefano Zampini #if defined(PETSC_USE_COMPLEX) 31489d54b7f4SStefano Zampini PetscStackCallBLAS("LAPACKsygvx",LAPACKsygvx_(&B_itype,"V","I","L",&B_N,St,&B_N,S,&B_N,&lower,&upper,&B_IL,&B_IU,&eps,&B_neigs,eigs,eigv,&B_N,work,&B_lwork,rwork,B_iwork,B_ifail,&B_ierr)); 3149d16cbb6bSStefano Zampini #else 31509d54b7f4SStefano Zampini PetscStackCallBLAS("LAPACKsygvx",LAPACKsygvx_(&B_itype,"V","I","L",&B_N,St,&B_N,S,&B_N,&lower,&upper,&B_IL,&B_IU,&eps,&B_neigs,eigs,eigv,&B_N,work,&B_lwork,B_iwork,B_ifail,&B_ierr)); 3151d16cbb6bSStefano Zampini #endif 3152b03ebc13SStefano Zampini } else { /* same_data is true, so just get the adaptive functional requested by the user */ 3153b7ab4a40SStefano Zampini PetscInt k; 3154b7ab4a40SStefano Zampini if (!sub_schurs->change_primal_sub) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"This should not happen"); 3155b7ab4a40SStefano Zampini ierr = ISGetLocalSize(sub_schurs->change_primal_sub[i],&nmax);CHKERRQ(ierr); 3156b7ab4a40SStefano Zampini ierr = PetscBLASIntCast(nmax,&B_neigs);CHKERRQ(ierr); 3157b7ab4a40SStefano Zampini nmin = nmax; 3158b7ab4a40SStefano Zampini ierr = PetscMemzero(eigv,subset_size*nmax*sizeof(PetscScalar));CHKERRQ(ierr); 3159b7ab4a40SStefano Zampini for (k=0;k<nmax;k++) { 3160b7ab4a40SStefano Zampini eigs[k] = 1./PETSC_SMALL; 3161b7ab4a40SStefano Zampini eigv[k*(subset_size+1)] = 1.0; 3162b7ab4a40SStefano Zampini } 3163d16cbb6bSStefano Zampini } 316408122e43SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 316508122e43SStefano Zampini if (B_ierr) { 31666c4ed002SBarry Smith if (B_ierr < 0 ) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in SYGVX Lapack routine: illegal value for argument %d",-(int)B_ierr); 31676c4ed002SBarry Smith else if (B_ierr <= B_N) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in SYGVX Lapack routine: %d eigenvalues failed to converge",(int)B_ierr); 31686c4ed002SBarry Smith else 
SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in SYGVX Lapack routine: leading minor of order %d is not positive definite",(int)B_ierr-B_N-1); 316908122e43SStefano Zampini } 317008122e43SStefano Zampini 317108122e43SStefano Zampini if (B_neigs > nmax) { 3172fd14bc51SStefano Zampini if (pcbddc->dbg_flag) { 3173fd14bc51SStefano Zampini PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer," found %d eigs, more than maximum required %d.\n",B_neigs,nmax); 3174fd14bc51SStefano Zampini } 31759d54b7f4SStefano Zampini if (pcbddc->use_deluxe_scaling) eigs_start = B_neigs -nmax; 317608122e43SStefano Zampini B_neigs = nmax; 317708122e43SStefano Zampini } 317808122e43SStefano Zampini 31799552c7c7SStefano Zampini nmin_s = PetscMin(nmin,B_N); 31809552c7c7SStefano Zampini if (B_neigs < nmin_s) { 318108122e43SStefano Zampini PetscBLASInt B_neigs2; 318208122e43SStefano Zampini 31839d54b7f4SStefano Zampini if (pcbddc->use_deluxe_scaling) { 3184f6f667cfSStefano Zampini B_IL = B_N - nmin_s + 1; 31859d54b7f4SStefano Zampini B_IU = B_N - B_neigs; 31869d54b7f4SStefano Zampini } else { 31879d54b7f4SStefano Zampini B_IL = B_neigs + 1; 31889d54b7f4SStefano Zampini B_IU = nmin_s; 31899d54b7f4SStefano Zampini } 3190fd14bc51SStefano Zampini if (pcbddc->dbg_flag) { 3191fd14bc51SStefano Zampini PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer," found %d eigs, less than minimum required %d. 
Asking for %d to %d incl (fortran like)\n",B_neigs,nmin,B_IL,B_IU); 3192fd14bc51SStefano Zampini } 31939ab7bb16SStefano Zampini if (sub_schurs->is_hermitian) { 31941ae86dd6SStefano Zampini PetscInt j,k; 319508122e43SStefano Zampini for (j=0;j<subset_size;j++) { 31961ae86dd6SStefano Zampini for (k=j;k<subset_size;k++) { 31971ae86dd6SStefano Zampini S [j*subset_size+k] = Sarray [cumarray+j*subset_size+k]; 31981ae86dd6SStefano Zampini St[j*subset_size+k] = Starray[cumarray+j*subset_size+k]; 319908122e43SStefano Zampini } 320008122e43SStefano Zampini } 320108122e43SStefano Zampini } else { 320208122e43SStefano Zampini ierr = PetscMemcpy(S,Sarray+cumarray,subset_size*subset_size*sizeof(PetscScalar));CHKERRQ(ierr); 320308122e43SStefano Zampini ierr = PetscMemcpy(St,Starray+cumarray,subset_size*subset_size*sizeof(PetscScalar));CHKERRQ(ierr); 320408122e43SStefano Zampini } 320508122e43SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 320608122e43SStefano Zampini #if defined(PETSC_USE_COMPLEX) 32079d54b7f4SStefano Zampini PetscStackCallBLAS("LAPACKsygvx",LAPACKsygvx_(&B_itype,"V","I","L",&B_N,St,&B_N,S,&B_N,&lower,&upper,&B_IL,&B_IU,&eps,&B_neigs2,eigs+B_neigs,eigv+B_neigs*subset_size,&B_N,work,&B_lwork,rwork,B_iwork,B_ifail,&B_ierr)); 320808122e43SStefano Zampini #else 32099d54b7f4SStefano Zampini PetscStackCallBLAS("LAPACKsygvx",LAPACKsygvx_(&B_itype,"V","I","L",&B_N,St,&B_N,S,&B_N,&lower,&upper,&B_IL,&B_IU,&eps,&B_neigs2,eigs+B_neigs,eigv+B_neigs*subset_size,&B_N,work,&B_lwork,B_iwork,B_ifail,&B_ierr)); 321008122e43SStefano Zampini #endif 321108122e43SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 321208122e43SStefano Zampini B_neigs += B_neigs2; 321308122e43SStefano Zampini } 321408122e43SStefano Zampini if (B_ierr) { 32156c4ed002SBarry Smith if (B_ierr < 0 ) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in SYGVX Lapack routine: illegal value for argument %d",-(int)B_ierr); 32166c4ed002SBarry Smith else if (B_ierr <= B_N) 
SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in SYGVX Lapack routine: %d eigenvalues failed to converge",(int)B_ierr); 32176c4ed002SBarry Smith else SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in SYGVX Lapack routine: leading minor of order %d is not positive definite",(int)B_ierr-B_N-1); 321808122e43SStefano Zampini } 3219fd14bc51SStefano Zampini if (pcbddc->dbg_flag) { 3220ac47001eSStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer," -> Got %d eigs\n",B_neigs);CHKERRQ(ierr); 322108122e43SStefano Zampini for (j=0;j<B_neigs;j++) { 322208122e43SStefano Zampini if (eigs[j] == 0.0) { 3223ac47001eSStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer," Inf\n");CHKERRQ(ierr); 322408122e43SStefano Zampini } else { 32259d54b7f4SStefano Zampini if (pcbddc->use_deluxe_scaling) { 3226ac47001eSStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer," %1.6e\n",eigs[j+eigs_start]);CHKERRQ(ierr); 32279d54b7f4SStefano Zampini } else { 32289d54b7f4SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer," %1.6e\n",1./eigs[j+eigs_start]);CHKERRQ(ierr); 32299d54b7f4SStefano Zampini } 3230fd14bc51SStefano Zampini } 323108122e43SStefano Zampini } 323208122e43SStefano Zampini } 323308122e43SStefano Zampini } else { 323408122e43SStefano Zampini /* TODO */ 323508122e43SStefano Zampini } 3236aff50787SStefano Zampini } 32376c3e6151SStefano Zampini /* change the basis back to the original one */ 32386c3e6151SStefano Zampini if (sub_schurs->change) { 323972b8c272SStefano Zampini Mat change,phi,phit; 32406c3e6151SStefano Zampini 32416c3e6151SStefano Zampini if (pcbddc->dbg_flag > 1) { 32426c3e6151SStefano Zampini PetscInt ii; 32436c3e6151SStefano Zampini for (ii=0;ii<B_neigs;ii++) { 32446c3e6151SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer," -> Eigenvector (old basis) %d/%d (%d)\n",ii,B_neigs,B_N);CHKERRQ(ierr); 32456c3e6151SStefano Zampini for (j=0;j<B_N;j++) { 
3246684229deSStefano Zampini #if defined(PETSC_USE_COMPLEX) 3247684229deSStefano Zampini PetscReal r = PetscRealPart(eigv[(ii+eigs_start)*subset_size+j]); 3248684229deSStefano Zampini PetscReal c = PetscImaginaryPart(eigv[(ii+eigs_start)*subset_size+j]); 3249684229deSStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer," %1.4e + %1.4e i\n",r,c);CHKERRQ(ierr); 3250684229deSStefano Zampini #else 32516c3e6151SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer," %1.4e\n",eigv[(ii+eigs_start)*subset_size+j]);CHKERRQ(ierr); 3252684229deSStefano Zampini #endif 32536c3e6151SStefano Zampini } 32546c3e6151SStefano Zampini } 32556c3e6151SStefano Zampini } 325672b8c272SStefano Zampini ierr = KSPGetOperators(sub_schurs->change[i],&change,NULL);CHKERRQ(ierr); 32576c3e6151SStefano Zampini ierr = MatCreateSeqDense(PETSC_COMM_SELF,subset_size,B_neigs,eigv+eigs_start*subset_size,&phit);CHKERRQ(ierr); 325872b8c272SStefano Zampini ierr = MatMatMult(change,phit,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&phi);CHKERRQ(ierr); 32596c3e6151SStefano Zampini ierr = MatCopy(phi,phit,SAME_NONZERO_PATTERN);CHKERRQ(ierr); 32606c3e6151SStefano Zampini ierr = MatDestroy(&phit);CHKERRQ(ierr); 32616c3e6151SStefano Zampini ierr = MatDestroy(&phi);CHKERRQ(ierr); 32626c3e6151SStefano Zampini } 32638bec7fa6SStefano Zampini maxneigs = PetscMax(B_neigs,maxneigs); 32648bec7fa6SStefano Zampini pcbddc->adaptive_constraints_n[i+nv] = B_neigs; 32659162d606SStefano Zampini if (B_neigs) { 32669162d606SStefano Zampini ierr = PetscMemcpy(pcbddc->adaptive_constraints_data+pcbddc->adaptive_constraints_data_ptr[cum],eigv+eigs_start*subset_size,B_neigs*subset_size*sizeof(PetscScalar));CHKERRQ(ierr); 3267fd14bc51SStefano Zampini 3268fd14bc51SStefano Zampini if (pcbddc->dbg_flag > 1) { 32699552c7c7SStefano Zampini PetscInt ii; 32709552c7c7SStefano Zampini for (ii=0;ii<B_neigs;ii++) { 3271ac47001eSStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer," -> 
Eigenvector %d/%d (%d)\n",ii,B_neigs,B_N);CHKERRQ(ierr); 32729552c7c7SStefano Zampini for (j=0;j<B_N;j++) { 3273ac47001eSStefano Zampini #if defined(PETSC_USE_COMPLEX) 3274ac47001eSStefano Zampini PetscReal r = PetscRealPart(pcbddc->adaptive_constraints_data[ii*subset_size+j+pcbddc->adaptive_constraints_data_ptr[cum]]); 3275ac47001eSStefano Zampini PetscReal c = PetscImaginaryPart(pcbddc->adaptive_constraints_data[ii*subset_size+j+pcbddc->adaptive_constraints_data_ptr[cum]]); 3276ac47001eSStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer," %1.4e + %1.4e i\n",r,c);CHKERRQ(ierr); 3277ac47001eSStefano Zampini #else 3278ac47001eSStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer," %1.4e\n",pcbddc->adaptive_constraints_data[ii*subset_size+j+pcbddc->adaptive_constraints_data_ptr[cum]]);CHKERRQ(ierr); 3279ac47001eSStefano Zampini #endif 32809552c7c7SStefano Zampini } 32819552c7c7SStefano Zampini } 3282fd14bc51SStefano Zampini } 32839162d606SStefano Zampini ierr = PetscMemcpy(pcbddc->adaptive_constraints_idxs+pcbddc->adaptive_constraints_idxs_ptr[cum],idxs,subset_size*sizeof(PetscInt));CHKERRQ(ierr); 32849162d606SStefano Zampini pcbddc->adaptive_constraints_idxs_ptr[cum+1] = pcbddc->adaptive_constraints_idxs_ptr[cum] + subset_size; 32859162d606SStefano Zampini pcbddc->adaptive_constraints_data_ptr[cum+1] = pcbddc->adaptive_constraints_data_ptr[cum] + subset_size*B_neigs; 32869162d606SStefano Zampini cum++; 328708122e43SStefano Zampini } 328808122e43SStefano Zampini ierr = ISRestoreIndices(sub_schurs->is_subs[i],&idxs);CHKERRQ(ierr); 328908122e43SStefano Zampini /* shift for next computation */ 329008122e43SStefano Zampini cumarray += subset_size*subset_size; 329108122e43SStefano Zampini } 3292fd14bc51SStefano Zampini if (pcbddc->dbg_flag) { 3293fd14bc51SStefano Zampini ierr = PetscViewerFlush(pcbddc->dbg_viewer);CHKERRQ(ierr); 3294fd14bc51SStefano Zampini } 329508122e43SStefano Zampini 329608122e43SStefano Zampini if 
(mss) { 329708122e43SStefano Zampini ierr = MatSeqAIJRestoreArray(sub_schurs->sum_S_Ej_inv_all,&Sarray);CHKERRQ(ierr); 329808122e43SStefano Zampini ierr = MatSeqAIJRestoreArray(sub_schurs->sum_S_Ej_tilda_all,&Starray);CHKERRQ(ierr); 3299f6f667cfSStefano Zampini /* destroy matrices (junk) */ 3300f6f667cfSStefano Zampini ierr = MatDestroy(&sub_schurs->sum_S_Ej_inv_all);CHKERRQ(ierr); 3301f6f667cfSStefano Zampini ierr = MatDestroy(&sub_schurs->sum_S_Ej_tilda_all);CHKERRQ(ierr); 330208122e43SStefano Zampini } 3303f6f667cfSStefano Zampini if (allocated_S_St) { 3304f6f667cfSStefano Zampini ierr = PetscFree2(S,St);CHKERRQ(ierr); 3305f6f667cfSStefano Zampini } 3306f6f667cfSStefano Zampini ierr = PetscFree5(eigv,eigs,work,B_iwork,B_ifail);CHKERRQ(ierr); 330708122e43SStefano Zampini #if defined(PETSC_USE_COMPLEX) 330808122e43SStefano Zampini ierr = PetscFree(rwork);CHKERRQ(ierr); 330908122e43SStefano Zampini #endif 331008122e43SStefano Zampini if (pcbddc->dbg_flag) { 33111b968477SStefano Zampini PetscInt maxneigs_r; 3312b2566f29SBarry Smith ierr = MPIU_Allreduce(&maxneigs,&maxneigs_r,1,MPIU_INT,MPI_MAX,PetscObjectComm((PetscObject)pc));CHKERRQ(ierr); 33139b28b941SStefano Zampini ierr = PetscViewerASCIIPrintf(pcbddc->dbg_viewer,"Maximum number of constraints per cc %d\n",maxneigs_r);CHKERRQ(ierr); 331408122e43SStefano Zampini } 331508122e43SStefano Zampini PetscFunctionReturn(0); 331608122e43SStefano Zampini } 3317b1b3d7a2SStefano Zampini 3318c8587f34SStefano Zampini PetscErrorCode PCBDDCSetUpSolvers(PC pc) 3319c8587f34SStefano Zampini { 33208629588bSStefano Zampini PetscScalar *coarse_submat_vals; 3321c8587f34SStefano Zampini PetscErrorCode ierr; 3322c8587f34SStefano Zampini 3323c8587f34SStefano Zampini PetscFunctionBegin; 3324f4ddd8eeSStefano Zampini /* Setup local scatters R_to_B and (optionally) R_to_D */ 33255e8657edSStefano Zampini /* PCBDDCSetUpLocalWorkVectors should be called first! 
*/ 3326c8587f34SStefano Zampini ierr = PCBDDCSetUpLocalScatters(pc);CHKERRQ(ierr); 3327c8587f34SStefano Zampini 3328684f6988SStefano Zampini /* Setup local neumann solver ksp_R */ 33290fccc4e9SStefano Zampini /* PCBDDCSetUpLocalScatters should be called first! */ 3330684f6988SStefano Zampini ierr = PCBDDCSetUpLocalSolvers(pc,PETSC_FALSE,PETSC_TRUE);CHKERRQ(ierr); 3331c8587f34SStefano Zampini 33328629588bSStefano Zampini /* 33338629588bSStefano Zampini Setup local correction and local part of coarse basis. 33348629588bSStefano Zampini Gives back the dense local part of the coarse matrix in column major ordering 33358629588bSStefano Zampini */ 333647f4ddc3SStefano Zampini ierr = PCBDDCSetUpCorrection(pc,&coarse_submat_vals);CHKERRQ(ierr); 33378629588bSStefano Zampini 33388629588bSStefano Zampini /* Compute total number of coarse nodes and setup coarse solver */ 33398629588bSStefano Zampini ierr = PCBDDCSetUpCoarseSolver(pc,coarse_submat_vals);CHKERRQ(ierr); 33408629588bSStefano Zampini 33418629588bSStefano Zampini /* free */ 33428629588bSStefano Zampini ierr = PetscFree(coarse_submat_vals);CHKERRQ(ierr); 3343c8587f34SStefano Zampini PetscFunctionReturn(0); 3344c8587f34SStefano Zampini } 3345c8587f34SStefano Zampini 3346674ae819SStefano Zampini PetscErrorCode PCBDDCResetCustomization(PC pc) 3347674ae819SStefano Zampini { 3348674ae819SStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 3349674ae819SStefano Zampini PetscErrorCode ierr; 3350674ae819SStefano Zampini 3351674ae819SStefano Zampini PetscFunctionBegin; 3352674ae819SStefano Zampini ierr = ISDestroy(&pcbddc->user_primal_vertices);CHKERRQ(ierr); 335330368db7SStefano Zampini ierr = ISDestroy(&pcbddc->user_primal_vertices_local);CHKERRQ(ierr); 3354674ae819SStefano Zampini ierr = ISDestroy(&pcbddc->NeumannBoundaries);CHKERRQ(ierr); 3355785d1243SStefano Zampini ierr = ISDestroy(&pcbddc->NeumannBoundariesLocal);CHKERRQ(ierr); 3356674ae819SStefano Zampini ierr = ISDestroy(&pcbddc->DirichletBoundaries);CHKERRQ(ierr); 
3357f4ddd8eeSStefano Zampini ierr = MatNullSpaceDestroy(&pcbddc->onearnullspace);CHKERRQ(ierr); 3358f4ddd8eeSStefano Zampini ierr = PetscFree(pcbddc->onearnullvecs_state);CHKERRQ(ierr); 3359785d1243SStefano Zampini ierr = ISDestroy(&pcbddc->DirichletBoundariesLocal);CHKERRQ(ierr); 336063602bcaSStefano Zampini ierr = PCBDDCSetDofsSplitting(pc,0,NULL);CHKERRQ(ierr); 336163602bcaSStefano Zampini ierr = PCBDDCSetDofsSplittingLocal(pc,0,NULL);CHKERRQ(ierr); 3362674ae819SStefano Zampini PetscFunctionReturn(0); 3363674ae819SStefano Zampini } 3364674ae819SStefano Zampini 3365674ae819SStefano Zampini PetscErrorCode PCBDDCResetTopography(PC pc) 3366674ae819SStefano Zampini { 3367674ae819SStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 33684f1b2e48SStefano Zampini PetscInt i; 3369674ae819SStefano Zampini PetscErrorCode ierr; 3370674ae819SStefano Zampini 3371674ae819SStefano Zampini PetscFunctionBegin; 33721e0482f5SStefano Zampini ierr = MatDestroy(&pcbddc->nedcG);CHKERRQ(ierr); 33731e0482f5SStefano Zampini ierr = ISDestroy(&pcbddc->nedclocal);CHKERRQ(ierr); 3374a13144ffSStefano Zampini ierr = MatDestroy(&pcbddc->discretegradient);CHKERRQ(ierr); 3375b9b85e73SStefano Zampini ierr = MatDestroy(&pcbddc->user_ChangeOfBasisMatrix);CHKERRQ(ierr); 3376674ae819SStefano Zampini ierr = MatDestroy(&pcbddc->ChangeOfBasisMatrix);CHKERRQ(ierr); 337716909a7fSStefano Zampini ierr = MatDestroy(&pcbddc->switch_static_change);CHKERRQ(ierr); 33781dd7afcfSStefano Zampini ierr = VecDestroy(&pcbddc->work_change);CHKERRQ(ierr); 3379674ae819SStefano Zampini ierr = MatDestroy(&pcbddc->ConstraintMatrix);CHKERRQ(ierr); 3380669cc0f4SStefano Zampini ierr = MatDestroy(&pcbddc->divudotp);CHKERRQ(ierr); 3381fa23a32eSStefano Zampini ierr = ISDestroy(&pcbddc->divudotp_vl2l);CHKERRQ(ierr); 33829326c5c6Sstefano_zampini ierr = PCBDDCGraphDestroy(&pcbddc->mat_graph);CHKERRQ(ierr); 33834f1b2e48SStefano Zampini for (i=0;i<pcbddc->n_local_subs;i++) { 33844f1b2e48SStefano Zampini ierr = 
ISDestroy(&pcbddc->local_subs[i]);CHKERRQ(ierr); 33854f1b2e48SStefano Zampini } 3386e68a0315Sstefano_zampini pcbddc->n_local_subs = 0; 33874f1b2e48SStefano Zampini ierr = PetscFree(pcbddc->local_subs);CHKERRQ(ierr); 3388e68a0315Sstefano_zampini ierr = PCBDDCSubSchursDestroy(&pcbddc->sub_schurs);CHKERRQ(ierr); 3389c703fcc7SStefano Zampini pcbddc->graphanalyzed = PETSC_FALSE; 33908af8fcf9SStefano Zampini pcbddc->recompute_topography = PETSC_TRUE; 3391674ae819SStefano Zampini PetscFunctionReturn(0); 3392674ae819SStefano Zampini } 3393674ae819SStefano Zampini 3394674ae819SStefano Zampini PetscErrorCode PCBDDCResetSolvers(PC pc) 3395674ae819SStefano Zampini { 3396674ae819SStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 3397674ae819SStefano Zampini PetscErrorCode ierr; 3398674ae819SStefano Zampini 3399674ae819SStefano Zampini PetscFunctionBegin; 3400674ae819SStefano Zampini ierr = VecDestroy(&pcbddc->coarse_vec);CHKERRQ(ierr); 340158da7f69SStefano Zampini if (pcbddc->coarse_phi_B) { 3402ca92afb2SStefano Zampini PetscScalar *array; 340306656605SStefano Zampini ierr = MatDenseGetArray(pcbddc->coarse_phi_B,&array);CHKERRQ(ierr); 340406656605SStefano Zampini ierr = PetscFree(array);CHKERRQ(ierr); 340558da7f69SStefano Zampini } 3406674ae819SStefano Zampini ierr = MatDestroy(&pcbddc->coarse_phi_B);CHKERRQ(ierr); 3407674ae819SStefano Zampini ierr = MatDestroy(&pcbddc->coarse_phi_D);CHKERRQ(ierr); 340815aaf578SStefano Zampini ierr = MatDestroy(&pcbddc->coarse_psi_B);CHKERRQ(ierr); 340915aaf578SStefano Zampini ierr = MatDestroy(&pcbddc->coarse_psi_D);CHKERRQ(ierr); 3410674ae819SStefano Zampini ierr = VecDestroy(&pcbddc->vec1_P);CHKERRQ(ierr); 3411674ae819SStefano Zampini ierr = VecDestroy(&pcbddc->vec1_C);CHKERRQ(ierr); 3412674ae819SStefano Zampini ierr = MatDestroy(&pcbddc->local_auxmat2);CHKERRQ(ierr); 341306656605SStefano Zampini ierr = MatDestroy(&pcbddc->local_auxmat1);CHKERRQ(ierr); 3414674ae819SStefano Zampini ierr = VecDestroy(&pcbddc->vec1_R);CHKERRQ(ierr); 
3415674ae819SStefano Zampini ierr = VecDestroy(&pcbddc->vec2_R);CHKERRQ(ierr); 34168ce42a96SStefano Zampini ierr = ISDestroy(&pcbddc->is_R_local);CHKERRQ(ierr); 3417674ae819SStefano Zampini ierr = VecScatterDestroy(&pcbddc->R_to_B);CHKERRQ(ierr); 3418674ae819SStefano Zampini ierr = VecScatterDestroy(&pcbddc->R_to_D);CHKERRQ(ierr); 3419674ae819SStefano Zampini ierr = VecScatterDestroy(&pcbddc->coarse_loc_to_glob);CHKERRQ(ierr); 34209326c5c6Sstefano_zampini ierr = KSPReset(pcbddc->ksp_D);CHKERRQ(ierr); 34219326c5c6Sstefano_zampini ierr = KSPReset(pcbddc->ksp_R);CHKERRQ(ierr); 34229326c5c6Sstefano_zampini ierr = KSPReset(pcbddc->coarse_ksp);CHKERRQ(ierr); 3423f4ddd8eeSStefano Zampini ierr = MatDestroy(&pcbddc->local_mat);CHKERRQ(ierr); 3424727cdba6SStefano Zampini ierr = PetscFree(pcbddc->primal_indices_local_idxs);CHKERRQ(ierr); 34250e6343abSStefano Zampini ierr = PetscFree2(pcbddc->local_primal_ref_node,pcbddc->local_primal_ref_mult);CHKERRQ(ierr); 3426f4ddd8eeSStefano Zampini ierr = PetscFree(pcbddc->global_primal_indices);CHKERRQ(ierr); 342770cf5478SStefano Zampini ierr = ISDestroy(&pcbddc->coarse_subassembling);CHKERRQ(ierr); 342881d14e9dSStefano Zampini ierr = MatDestroy(&pcbddc->benign_change);CHKERRQ(ierr); 34290369aaf7SStefano Zampini ierr = VecDestroy(&pcbddc->benign_vec);CHKERRQ(ierr); 34301dd7afcfSStefano Zampini ierr = PCBDDCBenignShellMat(pc,PETSC_TRUE);CHKERRQ(ierr); 34314f1b2e48SStefano Zampini ierr = MatDestroy(&pcbddc->benign_B0);CHKERRQ(ierr); 34328b9f24d4SStefano Zampini ierr = PetscSFDestroy(&pcbddc->benign_sf);CHKERRQ(ierr); 3433ca92afb2SStefano Zampini if (pcbddc->benign_zerodiag_subs) { 3434ca92afb2SStefano Zampini PetscInt i; 3435ca92afb2SStefano Zampini for (i=0;i<pcbddc->benign_n;i++) { 3436ca92afb2SStefano Zampini ierr = ISDestroy(&pcbddc->benign_zerodiag_subs[i]);CHKERRQ(ierr); 3437ca92afb2SStefano Zampini } 3438ca92afb2SStefano Zampini ierr = PetscFree(pcbddc->benign_zerodiag_subs);CHKERRQ(ierr); 3439ca92afb2SStefano Zampini } 
34404f1b2e48SStefano Zampini ierr = PetscFree3(pcbddc->benign_p0_lidx,pcbddc->benign_p0_gidx,pcbddc->benign_p0);CHKERRQ(ierr); 3441674ae819SStefano Zampini PetscFunctionReturn(0); 3442674ae819SStefano Zampini } 3443674ae819SStefano Zampini 3444f4ddd8eeSStefano Zampini PetscErrorCode PCBDDCSetUpLocalWorkVectors(PC pc) 34456bfb1811SStefano Zampini { 34466bfb1811SStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 34476bfb1811SStefano Zampini PC_IS *pcis = (PC_IS*)pc->data; 34486bfb1811SStefano Zampini VecType impVecType; 34494f1b2e48SStefano Zampini PetscInt n_constraints,n_R,old_size; 34506bfb1811SStefano Zampini PetscErrorCode ierr; 34516bfb1811SStefano Zampini 34526bfb1811SStefano Zampini PetscFunctionBegin; 34534f1b2e48SStefano Zampini n_constraints = pcbddc->local_primal_size - pcbddc->benign_n - pcbddc->n_vertices; 3454b371cd4fSStefano Zampini n_R = pcis->n - pcbddc->n_vertices; 34556bfb1811SStefano Zampini ierr = VecGetType(pcis->vec1_N,&impVecType);CHKERRQ(ierr); 3456e7b262bdSStefano Zampini /* local work vectors (try to avoid unneeded work)*/ 3457e7b262bdSStefano Zampini /* R nodes */ 3458e7b262bdSStefano Zampini old_size = -1; 3459e7b262bdSStefano Zampini if (pcbddc->vec1_R) { 3460e7b262bdSStefano Zampini ierr = VecGetSize(pcbddc->vec1_R,&old_size);CHKERRQ(ierr); 3461e7b262bdSStefano Zampini } 3462e7b262bdSStefano Zampini if (n_R != old_size) { 3463e7b262bdSStefano Zampini ierr = VecDestroy(&pcbddc->vec1_R);CHKERRQ(ierr); 3464e7b262bdSStefano Zampini ierr = VecDestroy(&pcbddc->vec2_R);CHKERRQ(ierr); 34656bfb1811SStefano Zampini ierr = VecCreate(PetscObjectComm((PetscObject)pcis->vec1_N),&pcbddc->vec1_R);CHKERRQ(ierr); 34666bfb1811SStefano Zampini ierr = VecSetSizes(pcbddc->vec1_R,PETSC_DECIDE,n_R);CHKERRQ(ierr); 34676bfb1811SStefano Zampini ierr = VecSetType(pcbddc->vec1_R,impVecType);CHKERRQ(ierr); 34686bfb1811SStefano Zampini ierr = VecDuplicate(pcbddc->vec1_R,&pcbddc->vec2_R);CHKERRQ(ierr); 3469e7b262bdSStefano Zampini } 3470e7b262bdSStefano Zampini /* 
local primal dofs */ 3471e7b262bdSStefano Zampini old_size = -1; 3472e7b262bdSStefano Zampini if (pcbddc->vec1_P) { 3473e7b262bdSStefano Zampini ierr = VecGetSize(pcbddc->vec1_P,&old_size);CHKERRQ(ierr); 3474e7b262bdSStefano Zampini } 3475e9189074SStefano Zampini if (pcbddc->local_primal_size != old_size) { 3476e7b262bdSStefano Zampini ierr = VecDestroy(&pcbddc->vec1_P);CHKERRQ(ierr); 347783b7ccabSStefano Zampini ierr = VecCreate(PetscObjectComm((PetscObject)pcis->vec1_N),&pcbddc->vec1_P);CHKERRQ(ierr); 3478e9189074SStefano Zampini ierr = VecSetSizes(pcbddc->vec1_P,PETSC_DECIDE,pcbddc->local_primal_size);CHKERRQ(ierr); 34796bfb1811SStefano Zampini ierr = VecSetType(pcbddc->vec1_P,impVecType);CHKERRQ(ierr); 3480e7b262bdSStefano Zampini } 3481e7b262bdSStefano Zampini /* local explicit constraints */ 3482e7b262bdSStefano Zampini old_size = -1; 3483e7b262bdSStefano Zampini if (pcbddc->vec1_C) { 3484e7b262bdSStefano Zampini ierr = VecGetSize(pcbddc->vec1_C,&old_size);CHKERRQ(ierr); 3485e7b262bdSStefano Zampini } 3486e7b262bdSStefano Zampini if (n_constraints && n_constraints != old_size) { 3487e7b262bdSStefano Zampini ierr = VecDestroy(&pcbddc->vec1_C);CHKERRQ(ierr); 348883b7ccabSStefano Zampini ierr = VecCreate(PetscObjectComm((PetscObject)pcis->vec1_N),&pcbddc->vec1_C);CHKERRQ(ierr); 348983b7ccabSStefano Zampini ierr = VecSetSizes(pcbddc->vec1_C,PETSC_DECIDE,n_constraints);CHKERRQ(ierr); 349083b7ccabSStefano Zampini ierr = VecSetType(pcbddc->vec1_C,impVecType);CHKERRQ(ierr); 349183b7ccabSStefano Zampini } 34926bfb1811SStefano Zampini PetscFunctionReturn(0); 34936bfb1811SStefano Zampini } 34946bfb1811SStefano Zampini 349547f4ddc3SStefano Zampini PetscErrorCode PCBDDCSetUpCorrection(PC pc, PetscScalar **coarse_submat_vals_n) 349688ebb749SStefano Zampini { 349725084f0cSStefano Zampini PetscErrorCode ierr; 349825084f0cSStefano Zampini /* pointers to pcis and pcbddc */ 349988ebb749SStefano Zampini PC_IS* pcis = (PC_IS*)pc->data; 350088ebb749SStefano Zampini PC_BDDC* pcbddc 
= (PC_BDDC*)pc->data; 3501d62866d3SStefano Zampini PCBDDCSubSchurs sub_schurs = pcbddc->sub_schurs; 350225084f0cSStefano Zampini /* submatrices of local problem */ 350380677318SStefano Zampini Mat A_RV,A_VR,A_VV,local_auxmat2_R; 350406656605SStefano Zampini /* submatrices of local coarse problem */ 350506656605SStefano Zampini Mat S_VV,S_CV,S_VC,S_CC; 350625084f0cSStefano Zampini /* working matrices */ 350706656605SStefano Zampini Mat C_CR; 350825084f0cSStefano Zampini /* additional working stuff */ 350906656605SStefano Zampini PC pc_R; 3510c58f9fdbSStefano Zampini Mat F,Brhs = NULL; 35115cbda25cSStefano Zampini Vec dummy_vec; 3512c58f9fdbSStefano Zampini PetscBool isLU,isCHOL,isILU,need_benign_correction,sparserhs; 351325084f0cSStefano Zampini PetscScalar *coarse_submat_vals; /* TODO: use a PETSc matrix */ 351406656605SStefano Zampini PetscScalar *work; 351506656605SStefano Zampini PetscInt *idx_V_B; 3516ffd830a3SStefano Zampini PetscInt lda_rhs,n,n_vertices,n_constraints,*p0_lidx_I; 351706656605SStefano Zampini PetscInt i,n_R,n_D,n_B; 3518ffd830a3SStefano Zampini 351925084f0cSStefano Zampini /* some shortcuts to scalars */ 352006656605SStefano Zampini PetscScalar one=1.0,m_one=-1.0; 352188ebb749SStefano Zampini 352288ebb749SStefano Zampini PetscFunctionBegin; 35239a962809SStefano Zampini if (!pcbddc->symmetric_primal && pcbddc->benign_n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"Non-symmetric primal basis computation with benign trick not yet implemented"); 3524ffd830a3SStefano Zampini 3525ffd830a3SStefano Zampini /* Set Non-overlapping dimensions */ 3526b371cd4fSStefano Zampini n_vertices = pcbddc->n_vertices; 35274f1b2e48SStefano Zampini n_constraints = pcbddc->local_primal_size - pcbddc->benign_n - n_vertices; 3528b371cd4fSStefano Zampini n_B = pcis->n_B; 3529b371cd4fSStefano Zampini n_D = pcis->n - n_B; 353088ebb749SStefano Zampini n_R = pcis->n - n_vertices; 353188ebb749SStefano Zampini 353288ebb749SStefano Zampini /* vertices in boundary numbering */ 
3533785e854fSJed Brown ierr = PetscMalloc1(n_vertices,&idx_V_B);CHKERRQ(ierr); 35340e6343abSStefano Zampini ierr = ISGlobalToLocalMappingApply(pcis->BtoNmap,IS_GTOLM_DROP,n_vertices,pcbddc->local_primal_ref_node,&i,idx_V_B);CHKERRQ(ierr); 35356c4ed002SBarry Smith if (i != n_vertices) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Error in boundary numbering for BDDC vertices! %D != %D\n",n_vertices,i); 353688ebb749SStefano Zampini 353706656605SStefano Zampini /* Subdomain contribution (Non-overlapping) to coarse matrix */ 3538019a44ceSStefano Zampini ierr = PetscCalloc1(pcbddc->local_primal_size*pcbddc->local_primal_size,&coarse_submat_vals);CHKERRQ(ierr); 353906656605SStefano Zampini ierr = MatCreateSeqDense(PETSC_COMM_SELF,n_vertices,n_vertices,coarse_submat_vals,&S_VV);CHKERRQ(ierr); 354006656605SStefano Zampini ierr = MatSeqDenseSetLDA(S_VV,pcbddc->local_primal_size);CHKERRQ(ierr); 354106656605SStefano Zampini ierr = MatCreateSeqDense(PETSC_COMM_SELF,n_constraints,n_vertices,coarse_submat_vals+n_vertices,&S_CV);CHKERRQ(ierr); 354206656605SStefano Zampini ierr = MatSeqDenseSetLDA(S_CV,pcbddc->local_primal_size);CHKERRQ(ierr); 354306656605SStefano Zampini ierr = MatCreateSeqDense(PETSC_COMM_SELF,n_vertices,n_constraints,coarse_submat_vals+pcbddc->local_primal_size*n_vertices,&S_VC);CHKERRQ(ierr); 354406656605SStefano Zampini ierr = MatSeqDenseSetLDA(S_VC,pcbddc->local_primal_size);CHKERRQ(ierr); 354506656605SStefano Zampini ierr = MatCreateSeqDense(PETSC_COMM_SELF,n_constraints,n_constraints,coarse_submat_vals+(pcbddc->local_primal_size+1)*n_vertices,&S_CC);CHKERRQ(ierr); 354606656605SStefano Zampini ierr = MatSeqDenseSetLDA(S_CC,pcbddc->local_primal_size);CHKERRQ(ierr); 354706656605SStefano Zampini 354806656605SStefano Zampini /* determine if can use MatSolve routines instead of calling KSPSolve on ksp_R */ 354906656605SStefano Zampini ierr = KSPGetPC(pcbddc->ksp_R,&pc_R);CHKERRQ(ierr); 355006656605SStefano Zampini ierr = 
PetscObjectTypeCompare((PetscObject)pc_R,PCLU,&isLU);CHKERRQ(ierr); 355106656605SStefano Zampini ierr = PetscObjectTypeCompare((PetscObject)pc_R,PCILU,&isILU);CHKERRQ(ierr); 355206656605SStefano Zampini ierr = PetscObjectTypeCompare((PetscObject)pc_R,PCCHOLESKY,&isCHOL);CHKERRQ(ierr); 3553ffd830a3SStefano Zampini lda_rhs = n_R; 3554a3df083aSStefano Zampini need_benign_correction = PETSC_FALSE; 355506656605SStefano Zampini if (isLU || isILU || isCHOL) { 355606656605SStefano Zampini ierr = PCFactorGetMatrix(pc_R,&F);CHKERRQ(ierr); 3557b334f244SStefano Zampini } else if (sub_schurs && sub_schurs->reuse_solver) { 3558df4d28bfSStefano Zampini PCBDDCReuseSolvers reuse_solver = sub_schurs->reuse_solver; 3559d62866d3SStefano Zampini MatFactorType type; 3560d62866d3SStefano Zampini 3561df4d28bfSStefano Zampini F = reuse_solver->F; 35626816873aSStefano Zampini ierr = MatGetFactorType(F,&type);CHKERRQ(ierr); 3563d62866d3SStefano Zampini if (type == MAT_FACTOR_CHOLESKY) isCHOL = PETSC_TRUE; 3564ffd830a3SStefano Zampini ierr = MatGetSize(F,&lda_rhs,NULL);CHKERRQ(ierr); 356522db5ddcSStefano Zampini need_benign_correction = (PetscBool)(!!reuse_solver->benign_n); 356606656605SStefano Zampini } else { 356706656605SStefano Zampini F = NULL; 356806656605SStefano Zampini } 356906656605SStefano Zampini 3570c58f9fdbSStefano Zampini /* determine if we can use a sparse right-hand side */ 3571c58f9fdbSStefano Zampini sparserhs = PETSC_FALSE; 3572c58f9fdbSStefano Zampini if (F) { 3573c58f9fdbSStefano Zampini const MatSolverPackage solver; 3574c58f9fdbSStefano Zampini 3575c58f9fdbSStefano Zampini ierr = MatFactorGetSolverPackage(F,&solver);CHKERRQ(ierr); 3576c58f9fdbSStefano Zampini ierr = PetscStrcmp(solver,MATSOLVERMUMPS,&sparserhs);CHKERRQ(ierr); 3577c58f9fdbSStefano Zampini } 3578c58f9fdbSStefano Zampini 3579ffd830a3SStefano Zampini /* allocate workspace */ 3580ffd830a3SStefano Zampini n = 0; 3581ffd830a3SStefano Zampini if (n_constraints) { 3582ffd830a3SStefano Zampini n += 
lda_rhs*n_constraints; 3583ffd830a3SStefano Zampini } 3584ffd830a3SStefano Zampini if (n_vertices) { 3585ffd830a3SStefano Zampini n = PetscMax(2*lda_rhs*n_vertices,n); 3586ffd830a3SStefano Zampini n = PetscMax((lda_rhs+n_B)*n_vertices,n); 3587ffd830a3SStefano Zampini } 35882a3a6641Sstefano_zampini if (!pcbddc->symmetric_primal) { 35892a3a6641Sstefano_zampini n = PetscMax(2*lda_rhs*pcbddc->local_primal_size,n); 35902a3a6641Sstefano_zampini } 3591ffd830a3SStefano Zampini ierr = PetscMalloc1(n,&work);CHKERRQ(ierr); 3592ffd830a3SStefano Zampini 35935cbda25cSStefano Zampini /* create dummy vector to modify rhs and sol of MatMatSolve (work array will never be used) */ 35945cbda25cSStefano Zampini dummy_vec = NULL; 35955cbda25cSStefano Zampini if (need_benign_correction && lda_rhs != n_R && F) { 35965cbda25cSStefano Zampini ierr = VecCreateSeqWithArray(PETSC_COMM_SELF,1,lda_rhs,work,&dummy_vec);CHKERRQ(ierr); 35975cbda25cSStefano Zampini } 35985cbda25cSStefano Zampini 359988ebb749SStefano Zampini /* Precompute stuffs needed for preprocessing and application of BDDC*/ 360088ebb749SStefano Zampini if (n_constraints) { 360172b8c272SStefano Zampini Mat M1,M2,M3,C_B; 360206656605SStefano Zampini IS is_aux; 360380677318SStefano Zampini PetscScalar *array,*array2; 360406656605SStefano Zampini 3605f4ddd8eeSStefano Zampini ierr = MatDestroy(&pcbddc->local_auxmat1);CHKERRQ(ierr); 360680677318SStefano Zampini ierr = MatDestroy(&pcbddc->local_auxmat2);CHKERRQ(ierr); 360788ebb749SStefano Zampini 360825084f0cSStefano Zampini /* Extract constraints on R nodes: C_{CR} */ 360925084f0cSStefano Zampini ierr = ISCreateStride(PETSC_COMM_SELF,n_constraints,n_vertices,1,&is_aux);CHKERRQ(ierr); 36107dae84e0SHong Zhang ierr = MatCreateSubMatrix(pcbddc->ConstraintMatrix,is_aux,pcbddc->is_R_local,MAT_INITIAL_MATRIX,&C_CR);CHKERRQ(ierr); 36117dae84e0SHong Zhang ierr = MatCreateSubMatrix(pcbddc->ConstraintMatrix,is_aux,pcis->is_B_local,MAT_INITIAL_MATRIX,&C_B);CHKERRQ(ierr); 361288ebb749SStefano 
Zampini 361380677318SStefano Zampini /* Assemble local_auxmat2_R = (- A_{RR}^{-1} C^T_{CR}) needed by BDDC setup */ 361480677318SStefano Zampini /* Assemble pcbddc->local_auxmat2 = R_to_B (- A_{RR}^{-1} C^T_{CR}) needed by BDDC application */ 3615c58f9fdbSStefano Zampini if (!sparserhs) { 3616ffd830a3SStefano Zampini ierr = PetscMemzero(work,lda_rhs*n_constraints*sizeof(PetscScalar));CHKERRQ(ierr); 361788ebb749SStefano Zampini for (i=0;i<n_constraints;i++) { 361806656605SStefano Zampini const PetscScalar *row_cmat_values; 361906656605SStefano Zampini const PetscInt *row_cmat_indices; 362006656605SStefano Zampini PetscInt size_of_constraint,j; 362188ebb749SStefano Zampini 362206656605SStefano Zampini ierr = MatGetRow(C_CR,i,&size_of_constraint,&row_cmat_indices,&row_cmat_values);CHKERRQ(ierr); 362306656605SStefano Zampini for (j=0;j<size_of_constraint;j++) { 3624ffd830a3SStefano Zampini work[row_cmat_indices[j]+i*lda_rhs] = -row_cmat_values[j]; 362506656605SStefano Zampini } 362606656605SStefano Zampini ierr = MatRestoreRow(C_CR,i,&size_of_constraint,&row_cmat_indices,&row_cmat_values);CHKERRQ(ierr); 362706656605SStefano Zampini } 3628c58f9fdbSStefano Zampini ierr = MatCreateSeqDense(PETSC_COMM_SELF,lda_rhs,n_constraints,work,&Brhs);CHKERRQ(ierr); 3629c58f9fdbSStefano Zampini } else { 3630c58f9fdbSStefano Zampini Mat tC_CR; 3631c58f9fdbSStefano Zampini 3632c58f9fdbSStefano Zampini ierr = MatScale(C_CR,-1.0);CHKERRQ(ierr); 3633c58f9fdbSStefano Zampini if (lda_rhs != n_R) { 3634c58f9fdbSStefano Zampini PetscScalar *aa; 3635c58f9fdbSStefano Zampini PetscInt r,*ii,*jj; 3636c58f9fdbSStefano Zampini PetscBool done; 3637c58f9fdbSStefano Zampini 3638c58f9fdbSStefano Zampini ierr = MatGetRowIJ(C_CR,0,PETSC_FALSE,PETSC_FALSE,&r,(const PetscInt**)&ii,(const PetscInt**)&jj,&done);CHKERRQ(ierr); 363913903a91SSatish Balay if (!done) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"GetRowIJ failed"); 3640c58f9fdbSStefano Zampini ierr = MatSeqAIJGetArray(C_CR,&aa);CHKERRQ(ierr); 
3641c58f9fdbSStefano Zampini ierr = MatCreateSeqAIJWithArrays(PETSC_COMM_SELF,n_constraints,lda_rhs,ii,jj,aa,&tC_CR);CHKERRQ(ierr); 3642c58f9fdbSStefano Zampini ierr = MatRestoreRowIJ(C_CR,0,PETSC_FALSE,PETSC_FALSE,&r,(const PetscInt**)&ii,(const PetscInt**)&jj,&done);CHKERRQ(ierr); 364313903a91SSatish Balay if (!done) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"RestoreRowIJ failed"); 3644c58f9fdbSStefano Zampini } else { 3645c58f9fdbSStefano Zampini ierr = PetscObjectReference((PetscObject)C_CR);CHKERRQ(ierr); 3646c58f9fdbSStefano Zampini tC_CR = C_CR; 3647c58f9fdbSStefano Zampini } 3648c58f9fdbSStefano Zampini ierr = MatCreateTranspose(tC_CR,&Brhs);CHKERRQ(ierr); 3649c58f9fdbSStefano Zampini ierr = MatDestroy(&tC_CR);CHKERRQ(ierr); 3650c58f9fdbSStefano Zampini } 3651ffd830a3SStefano Zampini ierr = MatCreateSeqDense(PETSC_COMM_SELF,lda_rhs,n_constraints,NULL,&local_auxmat2_R);CHKERRQ(ierr); 365206656605SStefano Zampini if (F) { 3653a3df083aSStefano Zampini if (need_benign_correction) { 3654df4d28bfSStefano Zampini PCBDDCReuseSolvers reuse_solver = sub_schurs->reuse_solver; 3655a3df083aSStefano Zampini 365672b8c272SStefano Zampini /* rhs is already zero on interior dofs, no need to change the rhs */ 365772b8c272SStefano Zampini ierr = PetscMemzero(reuse_solver->benign_save_vals,pcbddc->benign_n*sizeof(PetscScalar));CHKERRQ(ierr); 3658a3df083aSStefano Zampini } 3659c58f9fdbSStefano Zampini ierr = MatMatSolve(F,Brhs,local_auxmat2_R);CHKERRQ(ierr); 3660a3df083aSStefano Zampini if (need_benign_correction) { 3661a3df083aSStefano Zampini PetscScalar *marr; 3662df4d28bfSStefano Zampini PCBDDCReuseSolvers reuse_solver = sub_schurs->reuse_solver; 3663a3df083aSStefano Zampini 3664a3df083aSStefano Zampini ierr = MatDenseGetArray(local_auxmat2_R,&marr);CHKERRQ(ierr); 36655cbda25cSStefano Zampini if (lda_rhs != n_R) { 36665cbda25cSStefano Zampini for (i=0;i<n_constraints;i++) { 36675cbda25cSStefano Zampini ierr = VecPlaceArray(dummy_vec,marr+i*lda_rhs);CHKERRQ(ierr); 
36685cbda25cSStefano Zampini ierr = PCBDDCReuseSolversBenignAdapt(reuse_solver,dummy_vec,NULL,PETSC_TRUE,PETSC_TRUE);CHKERRQ(ierr); 36695cbda25cSStefano Zampini ierr = VecResetArray(dummy_vec);CHKERRQ(ierr); 36705cbda25cSStefano Zampini } 36715cbda25cSStefano Zampini } else { 3672a3df083aSStefano Zampini for (i=0;i<n_constraints;i++) { 3673a3df083aSStefano Zampini ierr = VecPlaceArray(pcbddc->vec1_R,marr+i*lda_rhs);CHKERRQ(ierr); 36745cbda25cSStefano Zampini ierr = PCBDDCReuseSolversBenignAdapt(reuse_solver,pcbddc->vec1_R,NULL,PETSC_TRUE,PETSC_TRUE);CHKERRQ(ierr); 3675a3df083aSStefano Zampini ierr = VecResetArray(pcbddc->vec1_R);CHKERRQ(ierr); 3676a3df083aSStefano Zampini } 36775cbda25cSStefano Zampini } 3678a3df083aSStefano Zampini ierr = MatDenseRestoreArray(local_auxmat2_R,&marr);CHKERRQ(ierr); 3679a3df083aSStefano Zampini } 368006656605SStefano Zampini } else { 368180677318SStefano Zampini PetscScalar *marr; 368280677318SStefano Zampini 368380677318SStefano Zampini ierr = MatDenseGetArray(local_auxmat2_R,&marr);CHKERRQ(ierr); 368406656605SStefano Zampini for (i=0;i<n_constraints;i++) { 3685ffd830a3SStefano Zampini ierr = VecPlaceArray(pcbddc->vec1_R,work+i*lda_rhs);CHKERRQ(ierr); 3686ffd830a3SStefano Zampini ierr = VecPlaceArray(pcbddc->vec2_R,marr+i*lda_rhs);CHKERRQ(ierr); 368706656605SStefano Zampini ierr = KSPSolve(pcbddc->ksp_R,pcbddc->vec1_R,pcbddc->vec2_R);CHKERRQ(ierr); 368806656605SStefano Zampini ierr = VecResetArray(pcbddc->vec1_R);CHKERRQ(ierr); 368906656605SStefano Zampini ierr = VecResetArray(pcbddc->vec2_R);CHKERRQ(ierr); 369006656605SStefano Zampini } 369180677318SStefano Zampini ierr = MatDenseRestoreArray(local_auxmat2_R,&marr);CHKERRQ(ierr); 369206656605SStefano Zampini } 3693c58f9fdbSStefano Zampini if (sparserhs) { 3694c58f9fdbSStefano Zampini ierr = MatScale(C_CR,-1.0);CHKERRQ(ierr); 3695c58f9fdbSStefano Zampini } 3696c58f9fdbSStefano Zampini ierr = MatDestroy(&Brhs);CHKERRQ(ierr); 369780677318SStefano Zampini if (!pcbddc->switch_static) { 
369880677318SStefano Zampini ierr = MatCreateSeqDense(PETSC_COMM_SELF,n_B,n_constraints,NULL,&pcbddc->local_auxmat2);CHKERRQ(ierr); 369980677318SStefano Zampini ierr = MatDenseGetArray(pcbddc->local_auxmat2,&array);CHKERRQ(ierr); 370080677318SStefano Zampini ierr = MatDenseGetArray(local_auxmat2_R,&array2);CHKERRQ(ierr); 370180677318SStefano Zampini for (i=0;i<n_constraints;i++) { 3702ffd830a3SStefano Zampini ierr = VecPlaceArray(pcbddc->vec1_R,array2+i*lda_rhs);CHKERRQ(ierr); 370380677318SStefano Zampini ierr = VecPlaceArray(pcis->vec1_B,array+i*n_B);CHKERRQ(ierr); 370480677318SStefano Zampini ierr = VecScatterBegin(pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 370580677318SStefano Zampini ierr = VecScatterEnd(pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 370680677318SStefano Zampini ierr = VecResetArray(pcis->vec1_B);CHKERRQ(ierr); 370780677318SStefano Zampini ierr = VecResetArray(pcbddc->vec1_R);CHKERRQ(ierr); 370880677318SStefano Zampini } 370980677318SStefano Zampini ierr = MatDenseRestoreArray(local_auxmat2_R,&array2);CHKERRQ(ierr); 371080677318SStefano Zampini ierr = MatDenseRestoreArray(pcbddc->local_auxmat2,&array);CHKERRQ(ierr); 371172b8c272SStefano Zampini ierr = MatMatMult(C_B,pcbddc->local_auxmat2,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&M3);CHKERRQ(ierr); 371280677318SStefano Zampini } else { 3713ffd830a3SStefano Zampini if (lda_rhs != n_R) { 3714ffd830a3SStefano Zampini IS dummy; 3715ffd830a3SStefano Zampini 3716ffd830a3SStefano Zampini ierr = ISCreateStride(PETSC_COMM_SELF,n_R,0,1,&dummy);CHKERRQ(ierr); 37177dae84e0SHong Zhang ierr = MatCreateSubMatrix(local_auxmat2_R,dummy,NULL,MAT_INITIAL_MATRIX,&pcbddc->local_auxmat2);CHKERRQ(ierr); 3718ffd830a3SStefano Zampini ierr = ISDestroy(&dummy);CHKERRQ(ierr); 3719ffd830a3SStefano Zampini } else { 372080677318SStefano Zampini ierr = PetscObjectReference((PetscObject)local_auxmat2_R);CHKERRQ(ierr); 372180677318SStefano Zampini 
pcbddc->local_auxmat2 = local_auxmat2_R; 3722ffd830a3SStefano Zampini } 372325084f0cSStefano Zampini ierr = MatMatMult(C_CR,pcbddc->local_auxmat2,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&M3);CHKERRQ(ierr); 372480677318SStefano Zampini } 372580677318SStefano Zampini ierr = ISDestroy(&is_aux);CHKERRQ(ierr); 372680677318SStefano Zampini /* Assemble explicitly S_CC = ( C_{CR} A_{RR}^{-1} C^T_{CR} )^{-1} */ 372780677318SStefano Zampini ierr = MatScale(M3,m_one);CHKERRQ(ierr); 372806656605SStefano Zampini ierr = MatDuplicate(M3,MAT_DO_NOT_COPY_VALUES,&M1);CHKERRQ(ierr); 372906656605SStefano Zampini ierr = MatDuplicate(M3,MAT_DO_NOT_COPY_VALUES,&M2);CHKERRQ(ierr); 373080677318SStefano Zampini if (isCHOL) { 373180677318SStefano Zampini ierr = MatCholeskyFactor(M3,NULL,NULL);CHKERRQ(ierr); 373280677318SStefano Zampini } else { 373325084f0cSStefano Zampini ierr = MatLUFactor(M3,NULL,NULL,NULL);CHKERRQ(ierr); 373480677318SStefano Zampini } 373580677318SStefano Zampini ierr = VecSet(pcbddc->vec1_C,one);CHKERRQ(ierr); 373606656605SStefano Zampini ierr = MatDiagonalSet(M2,pcbddc->vec1_C,INSERT_VALUES);CHKERRQ(ierr); 373725084f0cSStefano Zampini ierr = MatMatSolve(M3,M2,M1);CHKERRQ(ierr); 373825084f0cSStefano Zampini ierr = MatDestroy(&M2);CHKERRQ(ierr); 373925084f0cSStefano Zampini ierr = MatDestroy(&M3);CHKERRQ(ierr); 374080677318SStefano Zampini /* Assemble local_auxmat1 = S_CC*C_{CB} needed by BDDC application in KSP and in preproc */ 374172b8c272SStefano Zampini ierr = MatMatMult(M1,C_B,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&pcbddc->local_auxmat1);CHKERRQ(ierr); 374272b8c272SStefano Zampini ierr = MatDestroy(&C_B);CHKERRQ(ierr); 374306656605SStefano Zampini ierr = MatCopy(M1,S_CC,SAME_NONZERO_PATTERN);CHKERRQ(ierr); /* S_CC can have a different LDA, MatMatSolve doesn't support it */ 374406656605SStefano Zampini ierr = MatDestroy(&M1);CHKERRQ(ierr); 3745f4ddd8eeSStefano Zampini } 3746fc227af8SStefano Zampini 3747fc227af8SStefano Zampini /* Get submatrices from subdomain matrix */ 
374888ebb749SStefano Zampini if (n_vertices) { 374906656605SStefano Zampini IS is_aux; 3750c58f9fdbSStefano Zampini PetscBool isseqaij; 37513a50541eSStefano Zampini 3752b334f244SStefano Zampini if (sub_schurs && sub_schurs->reuse_solver) { /* is_R_local is not sorted, ISComplement doesn't like it */ 37536816873aSStefano Zampini IS tis; 37546816873aSStefano Zampini 37556816873aSStefano Zampini ierr = ISDuplicate(pcbddc->is_R_local,&tis);CHKERRQ(ierr); 37566816873aSStefano Zampini ierr = ISSort(tis);CHKERRQ(ierr); 37576816873aSStefano Zampini ierr = ISComplement(tis,0,pcis->n,&is_aux);CHKERRQ(ierr); 37586816873aSStefano Zampini ierr = ISDestroy(&tis);CHKERRQ(ierr); 37596816873aSStefano Zampini } else { 37603a50541eSStefano Zampini ierr = ISComplement(pcbddc->is_R_local,0,pcis->n,&is_aux);CHKERRQ(ierr); 37616816873aSStefano Zampini } 37627dae84e0SHong Zhang ierr = MatCreateSubMatrix(pcbddc->local_mat,pcbddc->is_R_local,is_aux,MAT_INITIAL_MATRIX,&A_RV);CHKERRQ(ierr); 37637dae84e0SHong Zhang ierr = MatCreateSubMatrix(pcbddc->local_mat,is_aux,pcbddc->is_R_local,MAT_INITIAL_MATRIX,&A_VR);CHKERRQ(ierr); 3764c58f9fdbSStefano Zampini ierr = PetscObjectTypeCompare((PetscObject)A_VR,MATSEQAIJ,&isseqaij);CHKERRQ(ierr); 3765c58f9fdbSStefano Zampini if (!isseqaij) { /* MatMatMult(A_VR,A_RRmA_RV) below will raise an error */ 3766c58f9fdbSStefano Zampini ierr = MatConvert(A_VR,MATSEQAIJ,MAT_INPLACE_MATRIX,&A_VR);CHKERRQ(ierr); 3767c58f9fdbSStefano Zampini } 37687dae84e0SHong Zhang ierr = MatCreateSubMatrix(pcbddc->local_mat,is_aux,is_aux,MAT_INITIAL_MATRIX,&A_VV);CHKERRQ(ierr); 376925084f0cSStefano Zampini ierr = ISDestroy(&is_aux);CHKERRQ(ierr); 377088ebb749SStefano Zampini } 377188ebb749SStefano Zampini 377288ebb749SStefano Zampini /* Matrix of coarse basis functions (local) */ 3773f4ddd8eeSStefano Zampini if (pcbddc->coarse_phi_B) { 377406656605SStefano Zampini PetscInt on_B,on_primal,on_D=n_D; 377506656605SStefano Zampini if (pcbddc->coarse_phi_D) { 377606656605SStefano Zampini 
ierr = MatGetSize(pcbddc->coarse_phi_D,&on_D,NULL);CHKERRQ(ierr); 377706656605SStefano Zampini } 3778f4ddd8eeSStefano Zampini ierr = MatGetSize(pcbddc->coarse_phi_B,&on_B,&on_primal);CHKERRQ(ierr); 377906656605SStefano Zampini if (on_B != n_B || on_primal != pcbddc->local_primal_size || on_D != n_D) { 378006656605SStefano Zampini PetscScalar *marray; 378106656605SStefano Zampini 378206656605SStefano Zampini ierr = MatDenseGetArray(pcbddc->coarse_phi_B,&marray);CHKERRQ(ierr); 378306656605SStefano Zampini ierr = PetscFree(marray);CHKERRQ(ierr); 3784f4ddd8eeSStefano Zampini ierr = MatDestroy(&pcbddc->coarse_phi_B);CHKERRQ(ierr); 3785f4ddd8eeSStefano Zampini ierr = MatDestroy(&pcbddc->coarse_psi_B);CHKERRQ(ierr); 3786f4ddd8eeSStefano Zampini ierr = MatDestroy(&pcbddc->coarse_phi_D);CHKERRQ(ierr); 3787f4ddd8eeSStefano Zampini ierr = MatDestroy(&pcbddc->coarse_psi_D);CHKERRQ(ierr); 3788f4ddd8eeSStefano Zampini } 3789f4ddd8eeSStefano Zampini } 379006656605SStefano Zampini 3791f4ddd8eeSStefano Zampini if (!pcbddc->coarse_phi_B) { 3792a6e023c1Sstefano_zampini PetscScalar *marr; 379388ebb749SStefano Zampini 3794a6e023c1Sstefano_zampini /* memory size */ 379506656605SStefano Zampini n = n_B*pcbddc->local_primal_size; 3796a6e023c1Sstefano_zampini if (pcbddc->switch_static || pcbddc->dbg_flag) n += n_D*pcbddc->local_primal_size; 3797a6e023c1Sstefano_zampini if (!pcbddc->symmetric_primal) n *= 2; 3798a6e023c1Sstefano_zampini ierr = PetscCalloc1(n,&marr);CHKERRQ(ierr); 3799a6e023c1Sstefano_zampini ierr = MatCreateSeqDense(PETSC_COMM_SELF,n_B,pcbddc->local_primal_size,marr,&pcbddc->coarse_phi_B);CHKERRQ(ierr); 3800a6e023c1Sstefano_zampini marr += n_B*pcbddc->local_primal_size; 38018eeda7d8SStefano Zampini if (pcbddc->switch_static || pcbddc->dbg_flag) { 3802a6e023c1Sstefano_zampini ierr = MatCreateSeqDense(PETSC_COMM_SELF,n_D,pcbddc->local_primal_size,marr,&pcbddc->coarse_phi_D);CHKERRQ(ierr); 3803a6e023c1Sstefano_zampini marr += n_D*pcbddc->local_primal_size; 380488ebb749SStefano 
Zampini } 38053301b35fSStefano Zampini if (!pcbddc->symmetric_primal) { 3806a6e023c1Sstefano_zampini ierr = MatCreateSeqDense(PETSC_COMM_SELF,n_B,pcbddc->local_primal_size,marr,&pcbddc->coarse_psi_B);CHKERRQ(ierr); 3807a6e023c1Sstefano_zampini marr += n_B*pcbddc->local_primal_size; 38088eeda7d8SStefano Zampini if (pcbddc->switch_static || pcbddc->dbg_flag) { 3809a6e023c1Sstefano_zampini ierr = MatCreateSeqDense(PETSC_COMM_SELF,n_D,pcbddc->local_primal_size,marr,&pcbddc->coarse_psi_D);CHKERRQ(ierr); 381088ebb749SStefano Zampini } 381188ebb749SStefano Zampini } else { 3812c0553b1fSStefano Zampini ierr = PetscObjectReference((PetscObject)pcbddc->coarse_phi_B);CHKERRQ(ierr); 3813c0553b1fSStefano Zampini pcbddc->coarse_psi_B = pcbddc->coarse_phi_B; 38141b968477SStefano Zampini if (pcbddc->switch_static || pcbddc->dbg_flag) { 3815c0553b1fSStefano Zampini ierr = PetscObjectReference((PetscObject)pcbddc->coarse_phi_D);CHKERRQ(ierr); 3816c0553b1fSStefano Zampini pcbddc->coarse_psi_D = pcbddc->coarse_phi_D; 3817c0553b1fSStefano Zampini } 381888ebb749SStefano Zampini } 381906656605SStefano Zampini } 3820019a44ceSStefano Zampini 382106656605SStefano Zampini /* We are now ready to evaluate coarse basis functions and subdomain contribution to coarse problem */ 38224f1b2e48SStefano Zampini p0_lidx_I = NULL; 38234f1b2e48SStefano Zampini if (pcbddc->benign_n && (pcbddc->switch_static || pcbddc->dbg_flag)) { 3824d12edf2fSStefano Zampini const PetscInt *idxs; 3825d12edf2fSStefano Zampini 3826d12edf2fSStefano Zampini ierr = ISGetIndices(pcis->is_I_local,&idxs);CHKERRQ(ierr); 38274f1b2e48SStefano Zampini ierr = PetscMalloc1(pcbddc->benign_n,&p0_lidx_I);CHKERRQ(ierr); 38284f1b2e48SStefano Zampini for (i=0;i<pcbddc->benign_n;i++) { 38294f1b2e48SStefano Zampini ierr = PetscFindInt(pcbddc->benign_p0_lidx[i],pcis->n-pcis->n_B,idxs,&p0_lidx_I[i]);CHKERRQ(ierr); 38304f1b2e48SStefano Zampini } 3831d12edf2fSStefano Zampini ierr = ISRestoreIndices(pcis->is_I_local,&idxs);CHKERRQ(ierr); 
3832d12edf2fSStefano Zampini } 3833d16cbb6bSStefano Zampini 383406656605SStefano Zampini /* vertices */ 383506656605SStefano Zampini if (n_vertices) { 3836c58f9fdbSStefano Zampini PetscBool restoreavr = PETSC_FALSE; 383716f15bc4SStefano Zampini 3838af25d912SStefano Zampini ierr = MatConvert(A_VV,MATDENSE,MAT_INPLACE_MATRIX,&A_VV);CHKERRQ(ierr); 383904708bb6SStefano Zampini 384016f15bc4SStefano Zampini if (n_R) { 384114393ed6SStefano Zampini Mat A_RRmA_RV,A_RV_bcorr=NULL,S_VVt; /* S_VVt with LDA=N */ 384206656605SStefano Zampini PetscBLASInt B_N,B_one = 1; 384316f15bc4SStefano Zampini PetscScalar *x,*y; 384406656605SStefano Zampini 384521eccb56SStefano Zampini ierr = MatScale(A_RV,m_one);CHKERRQ(ierr); 384614393ed6SStefano Zampini if (need_benign_correction) { 384714393ed6SStefano Zampini ISLocalToGlobalMapping RtoN; 384814393ed6SStefano Zampini IS is_p0; 384914393ed6SStefano Zampini PetscInt *idxs_p0,n; 385014393ed6SStefano Zampini 385114393ed6SStefano Zampini ierr = PetscMalloc1(pcbddc->benign_n,&idxs_p0);CHKERRQ(ierr); 385214393ed6SStefano Zampini ierr = ISLocalToGlobalMappingCreateIS(pcbddc->is_R_local,&RtoN);CHKERRQ(ierr); 385314393ed6SStefano Zampini ierr = ISGlobalToLocalMappingApply(RtoN,IS_GTOLM_DROP,pcbddc->benign_n,pcbddc->benign_p0_lidx,&n,idxs_p0);CHKERRQ(ierr); 3854af25d912SStefano Zampini if (n != pcbddc->benign_n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Error in R numbering for benign p0! 
%d != %d\n",n,pcbddc->benign_n); 385514393ed6SStefano Zampini ierr = ISLocalToGlobalMappingDestroy(&RtoN);CHKERRQ(ierr); 385614393ed6SStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,n,idxs_p0,PETSC_OWN_POINTER,&is_p0);CHKERRQ(ierr); 38577dae84e0SHong Zhang ierr = MatCreateSubMatrix(A_RV,is_p0,NULL,MAT_INITIAL_MATRIX,&A_RV_bcorr);CHKERRQ(ierr); 385814393ed6SStefano Zampini ierr = ISDestroy(&is_p0);CHKERRQ(ierr); 385914393ed6SStefano Zampini } 386014393ed6SStefano Zampini 3861c58f9fdbSStefano Zampini ierr = MatCreateSeqDense(PETSC_COMM_SELF,lda_rhs,n_vertices,work,&A_RRmA_RV);CHKERRQ(ierr); 3862c58f9fdbSStefano Zampini if (!sparserhs || need_benign_correction) { 3863ffd830a3SStefano Zampini if (lda_rhs == n_R) { 3864af25d912SStefano Zampini ierr = MatConvert(A_RV,MATDENSE,MAT_INPLACE_MATRIX,&A_RV);CHKERRQ(ierr); 3865ffd830a3SStefano Zampini } else { 3866ca92afb2SStefano Zampini PetscScalar *av,*array; 3867ca92afb2SStefano Zampini const PetscInt *xadj,*adjncy; 3868ca92afb2SStefano Zampini PetscInt n; 3869ca92afb2SStefano Zampini PetscBool flg_row; 3870ffd830a3SStefano Zampini 3871ca92afb2SStefano Zampini array = work+lda_rhs*n_vertices; 3872ca92afb2SStefano Zampini ierr = PetscMemzero(array,lda_rhs*n_vertices*sizeof(PetscScalar));CHKERRQ(ierr); 38739d54b7f4SStefano Zampini ierr = MatConvert(A_RV,MATSEQAIJ,MAT_INPLACE_MATRIX,&A_RV);CHKERRQ(ierr); 3874ca92afb2SStefano Zampini ierr = MatGetRowIJ(A_RV,0,PETSC_FALSE,PETSC_FALSE,&n,&xadj,&adjncy,&flg_row);CHKERRQ(ierr); 3875ca92afb2SStefano Zampini ierr = MatSeqAIJGetArray(A_RV,&av);CHKERRQ(ierr); 3876ca92afb2SStefano Zampini for (i=0;i<n;i++) { 3877ca92afb2SStefano Zampini PetscInt j; 3878ca92afb2SStefano Zampini for (j=xadj[i];j<xadj[i+1];j++) array[lda_rhs*adjncy[j]+i] = av[j]; 3879ffd830a3SStefano Zampini } 3880ca92afb2SStefano Zampini ierr = MatRestoreRowIJ(A_RV,0,PETSC_FALSE,PETSC_FALSE,&n,&xadj,&adjncy,&flg_row);CHKERRQ(ierr); 3881ca92afb2SStefano Zampini ierr = MatDestroy(&A_RV);CHKERRQ(ierr); 
3882ca92afb2SStefano Zampini ierr = MatCreateSeqDense(PETSC_COMM_SELF,lda_rhs,n_vertices,array,&A_RV);CHKERRQ(ierr); 3883ffd830a3SStefano Zampini } 3884a3df083aSStefano Zampini if (need_benign_correction) { 3885df4d28bfSStefano Zampini PCBDDCReuseSolvers reuse_solver = sub_schurs->reuse_solver; 3886a3df083aSStefano Zampini PetscScalar *marr; 3887a3df083aSStefano Zampini 3888a3df083aSStefano Zampini ierr = MatDenseGetArray(A_RV,&marr);CHKERRQ(ierr); 388914393ed6SStefano Zampini /* need \Phi^T A_RV = (I+L)A_RV, L given by 389014393ed6SStefano Zampini 389114393ed6SStefano Zampini | 0 0 0 | (V) 389214393ed6SStefano Zampini L = | 0 0 -1 | (P-p0) 389314393ed6SStefano Zampini | 0 0 -1 | (p0) 389414393ed6SStefano Zampini 389514393ed6SStefano Zampini */ 3896df4d28bfSStefano Zampini for (i=0;i<reuse_solver->benign_n;i++) { 389714393ed6SStefano Zampini const PetscScalar *vals; 389814393ed6SStefano Zampini const PetscInt *idxs,*idxs_zero; 389914393ed6SStefano Zampini PetscInt n,j,nz; 390014393ed6SStefano Zampini 3901df4d28bfSStefano Zampini ierr = ISGetLocalSize(reuse_solver->benign_zerodiag_subs[i],&nz);CHKERRQ(ierr); 3902df4d28bfSStefano Zampini ierr = ISGetIndices(reuse_solver->benign_zerodiag_subs[i],&idxs_zero);CHKERRQ(ierr); 390314393ed6SStefano Zampini ierr = MatGetRow(A_RV_bcorr,i,&n,&idxs,&vals);CHKERRQ(ierr); 390414393ed6SStefano Zampini for (j=0;j<n;j++) { 390514393ed6SStefano Zampini PetscScalar val = vals[j]; 390614393ed6SStefano Zampini PetscInt k,col = idxs[j]; 390714393ed6SStefano Zampini for (k=0;k<nz;k++) marr[idxs_zero[k]+lda_rhs*col] -= val; 390814393ed6SStefano Zampini } 390914393ed6SStefano Zampini ierr = MatRestoreRow(A_RV_bcorr,i,&n,&idxs,&vals);CHKERRQ(ierr); 3910df4d28bfSStefano Zampini ierr = ISRestoreIndices(reuse_solver->benign_zerodiag_subs[i],&idxs_zero);CHKERRQ(ierr); 391114393ed6SStefano Zampini } 391272b8c272SStefano Zampini ierr = MatDenseRestoreArray(A_RV,&marr);CHKERRQ(ierr); 391372b8c272SStefano Zampini } 3914c58f9fdbSStefano Zampini ierr 
= PetscObjectReference((PetscObject)A_RV);CHKERRQ(ierr); 3915c58f9fdbSStefano Zampini Brhs = A_RV; 3916c58f9fdbSStefano Zampini } else { 3917c58f9fdbSStefano Zampini Mat tA_RVT,A_RVT; 3918c58f9fdbSStefano Zampini 3919c58f9fdbSStefano Zampini if (!pcbddc->symmetric_primal) { 3920c58f9fdbSStefano Zampini ierr = MatTranspose(A_RV,MAT_INITIAL_MATRIX,&A_RVT);CHKERRQ(ierr); 3921c58f9fdbSStefano Zampini } else { 3922c58f9fdbSStefano Zampini restoreavr = PETSC_TRUE; 3923c58f9fdbSStefano Zampini ierr = MatScale(A_VR,-1.0);CHKERRQ(ierr); 3924c58f9fdbSStefano Zampini ierr = PetscObjectReference((PetscObject)A_VR);CHKERRQ(ierr); 3925c58f9fdbSStefano Zampini A_RVT = A_VR; 3926c58f9fdbSStefano Zampini } 3927c58f9fdbSStefano Zampini if (lda_rhs != n_R) { 3928c58f9fdbSStefano Zampini PetscScalar *aa; 3929c58f9fdbSStefano Zampini PetscInt r,*ii,*jj; 3930c58f9fdbSStefano Zampini PetscBool done; 3931c58f9fdbSStefano Zampini 3932c58f9fdbSStefano Zampini ierr = MatGetRowIJ(A_RVT,0,PETSC_FALSE,PETSC_FALSE,&r,(const PetscInt**)&ii,(const PetscInt**)&jj,&done);CHKERRQ(ierr); 393313903a91SSatish Balay if (!done) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"GetRowIJ failed"); 3934c58f9fdbSStefano Zampini ierr = MatSeqAIJGetArray(A_RVT,&aa);CHKERRQ(ierr); 3935c58f9fdbSStefano Zampini ierr = MatCreateSeqAIJWithArrays(PETSC_COMM_SELF,n_vertices,lda_rhs,ii,jj,aa,&tA_RVT);CHKERRQ(ierr); 3936c58f9fdbSStefano Zampini ierr = MatRestoreRowIJ(A_RVT,0,PETSC_FALSE,PETSC_FALSE,&r,(const PetscInt**)&ii,(const PetscInt**)&jj,&done);CHKERRQ(ierr); 393713903a91SSatish Balay if (!done) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"RestoreRowIJ failed"); 3938c58f9fdbSStefano Zampini } else { 3939c58f9fdbSStefano Zampini ierr = PetscObjectReference((PetscObject)A_RVT);CHKERRQ(ierr); 3940c58f9fdbSStefano Zampini tA_RVT = A_RVT; 3941c58f9fdbSStefano Zampini } 3942c58f9fdbSStefano Zampini ierr = MatCreateTranspose(tA_RVT,&Brhs);CHKERRQ(ierr); 3943c58f9fdbSStefano Zampini ierr = MatDestroy(&tA_RVT);CHKERRQ(ierr); 
3944c58f9fdbSStefano Zampini ierr = MatDestroy(&A_RVT);CHKERRQ(ierr); 3945c58f9fdbSStefano Zampini } 394672b8c272SStefano Zampini if (F) { 394714393ed6SStefano Zampini /* need to correct the rhs */ 394872b8c272SStefano Zampini if (need_benign_correction) { 394972b8c272SStefano Zampini PCBDDCReuseSolvers reuse_solver = sub_schurs->reuse_solver; 395072b8c272SStefano Zampini PetscScalar *marr; 395172b8c272SStefano Zampini 3952c58f9fdbSStefano Zampini ierr = MatDenseGetArray(Brhs,&marr);CHKERRQ(ierr); 39535cbda25cSStefano Zampini if (lda_rhs != n_R) { 39545cbda25cSStefano Zampini for (i=0;i<n_vertices;i++) { 39555cbda25cSStefano Zampini ierr = VecPlaceArray(dummy_vec,marr+i*lda_rhs);CHKERRQ(ierr); 39565cbda25cSStefano Zampini ierr = PCBDDCReuseSolversBenignAdapt(reuse_solver,dummy_vec,NULL,PETSC_FALSE,PETSC_TRUE);CHKERRQ(ierr); 39575cbda25cSStefano Zampini ierr = VecResetArray(dummy_vec);CHKERRQ(ierr); 39585cbda25cSStefano Zampini } 39595cbda25cSStefano Zampini } else { 3960a3df083aSStefano Zampini for (i=0;i<n_vertices;i++) { 3961a3df083aSStefano Zampini ierr = VecPlaceArray(pcbddc->vec1_R,marr+i*lda_rhs);CHKERRQ(ierr); 39625cbda25cSStefano Zampini ierr = PCBDDCReuseSolversBenignAdapt(reuse_solver,pcbddc->vec1_R,NULL,PETSC_FALSE,PETSC_TRUE);CHKERRQ(ierr); 3963a3df083aSStefano Zampini ierr = VecResetArray(pcbddc->vec1_R);CHKERRQ(ierr); 3964a3df083aSStefano Zampini } 39655cbda25cSStefano Zampini } 3966c58f9fdbSStefano Zampini ierr = MatDenseRestoreArray(Brhs,&marr);CHKERRQ(ierr); 3967a3df083aSStefano Zampini } 3968c58f9fdbSStefano Zampini ierr = MatMatSolve(F,Brhs,A_RRmA_RV);CHKERRQ(ierr); 3969c58f9fdbSStefano Zampini if (restoreavr) { 3970c58f9fdbSStefano Zampini ierr = MatScale(A_VR,-1.0);CHKERRQ(ierr); 3971c58f9fdbSStefano Zampini } 397214393ed6SStefano Zampini /* need to correct the solution */ 3973a3df083aSStefano Zampini if (need_benign_correction) { 3974df4d28bfSStefano Zampini PCBDDCReuseSolvers reuse_solver = sub_schurs->reuse_solver; 3975a3df083aSStefano 
Zampini PetscScalar *marr; 3976a3df083aSStefano Zampini 3977a3df083aSStefano Zampini ierr = MatDenseGetArray(A_RRmA_RV,&marr);CHKERRQ(ierr); 39785cbda25cSStefano Zampini if (lda_rhs != n_R) { 39795cbda25cSStefano Zampini for (i=0;i<n_vertices;i++) { 39805cbda25cSStefano Zampini ierr = VecPlaceArray(dummy_vec,marr+i*lda_rhs);CHKERRQ(ierr); 39815cbda25cSStefano Zampini ierr = PCBDDCReuseSolversBenignAdapt(reuse_solver,dummy_vec,NULL,PETSC_TRUE,PETSC_TRUE);CHKERRQ(ierr); 39825cbda25cSStefano Zampini ierr = VecResetArray(dummy_vec);CHKERRQ(ierr); 39835cbda25cSStefano Zampini } 39845cbda25cSStefano Zampini } else { 3985a3df083aSStefano Zampini for (i=0;i<n_vertices;i++) { 3986a3df083aSStefano Zampini ierr = VecPlaceArray(pcbddc->vec1_R,marr+i*lda_rhs);CHKERRQ(ierr); 39875cbda25cSStefano Zampini ierr = PCBDDCReuseSolversBenignAdapt(reuse_solver,pcbddc->vec1_R,NULL,PETSC_TRUE,PETSC_TRUE);CHKERRQ(ierr); 3988a3df083aSStefano Zampini ierr = VecResetArray(pcbddc->vec1_R);CHKERRQ(ierr); 3989a3df083aSStefano Zampini } 39905cbda25cSStefano Zampini } 3991a3df083aSStefano Zampini ierr = MatDenseRestoreArray(A_RRmA_RV,&marr);CHKERRQ(ierr); 3992a3df083aSStefano Zampini } 399306656605SStefano Zampini } else { 3994c58f9fdbSStefano Zampini ierr = MatDenseGetArray(Brhs,&y);CHKERRQ(ierr); 399506656605SStefano Zampini for (i=0;i<n_vertices;i++) { 3996ffd830a3SStefano Zampini ierr = VecPlaceArray(pcbddc->vec1_R,y+i*lda_rhs);CHKERRQ(ierr); 3997ffd830a3SStefano Zampini ierr = VecPlaceArray(pcbddc->vec2_R,work+i*lda_rhs);CHKERRQ(ierr); 399806656605SStefano Zampini ierr = KSPSolve(pcbddc->ksp_R,pcbddc->vec1_R,pcbddc->vec2_R);CHKERRQ(ierr); 399906656605SStefano Zampini ierr = VecResetArray(pcbddc->vec1_R);CHKERRQ(ierr); 400006656605SStefano Zampini ierr = VecResetArray(pcbddc->vec2_R);CHKERRQ(ierr); 400106656605SStefano Zampini } 4002c58f9fdbSStefano Zampini ierr = MatDenseRestoreArray(Brhs,&y);CHKERRQ(ierr); 400306656605SStefano Zampini } 400480677318SStefano Zampini ierr = 
MatDestroy(&A_RV);CHKERRQ(ierr); 4005c58f9fdbSStefano Zampini ierr = MatDestroy(&Brhs);CHKERRQ(ierr); 4006ffd830a3SStefano Zampini /* S_VV and S_CV */ 400706656605SStefano Zampini if (n_constraints) { 400806656605SStefano Zampini Mat B; 400980677318SStefano Zampini 4010ffd830a3SStefano Zampini ierr = PetscMemzero(work+lda_rhs*n_vertices,n_B*n_vertices*sizeof(PetscScalar));CHKERRQ(ierr); 401180677318SStefano Zampini for (i=0;i<n_vertices;i++) { 4012ffd830a3SStefano Zampini ierr = VecPlaceArray(pcbddc->vec1_R,work+i*lda_rhs);CHKERRQ(ierr); 4013ffd830a3SStefano Zampini ierr = VecPlaceArray(pcis->vec1_B,work+lda_rhs*n_vertices+i*n_B);CHKERRQ(ierr); 401480677318SStefano Zampini ierr = VecScatterBegin(pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 401580677318SStefano Zampini ierr = VecScatterEnd(pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 401680677318SStefano Zampini ierr = VecResetArray(pcis->vec1_B);CHKERRQ(ierr); 401780677318SStefano Zampini ierr = VecResetArray(pcbddc->vec1_R);CHKERRQ(ierr); 401880677318SStefano Zampini } 4019ffd830a3SStefano Zampini ierr = MatCreateSeqDense(PETSC_COMM_SELF,n_B,n_vertices,work+lda_rhs*n_vertices,&B);CHKERRQ(ierr); 402080677318SStefano Zampini ierr = MatMatMult(pcbddc->local_auxmat1,B,MAT_REUSE_MATRIX,PETSC_DEFAULT,&S_CV);CHKERRQ(ierr); 402180677318SStefano Zampini ierr = MatDestroy(&B);CHKERRQ(ierr); 4022ffd830a3SStefano Zampini ierr = MatCreateSeqDense(PETSC_COMM_SELF,lda_rhs,n_vertices,work+lda_rhs*n_vertices,&B);CHKERRQ(ierr); 402380677318SStefano Zampini ierr = MatMatMult(local_auxmat2_R,S_CV,MAT_REUSE_MATRIX,PETSC_DEFAULT,&B);CHKERRQ(ierr); 402406656605SStefano Zampini ierr = MatScale(S_CV,m_one);CHKERRQ(ierr); 4025ffd830a3SStefano Zampini ierr = PetscBLASIntCast(lda_rhs*n_vertices,&B_N);CHKERRQ(ierr); 4026ffd830a3SStefano Zampini PetscStackCallBLAS("BLASaxpy",BLASaxpy_(&B_N,&one,work+lda_rhs*n_vertices,&B_one,work,&B_one)); 
402706656605SStefano Zampini ierr = MatDestroy(&B);CHKERRQ(ierr); 402806656605SStefano Zampini } 4029ffd830a3SStefano Zampini if (lda_rhs != n_R) { 4030ffd830a3SStefano Zampini ierr = MatDestroy(&A_RRmA_RV);CHKERRQ(ierr); 4031ffd830a3SStefano Zampini ierr = MatCreateSeqDense(PETSC_COMM_SELF,n_R,n_vertices,work,&A_RRmA_RV);CHKERRQ(ierr); 4032ffd830a3SStefano Zampini ierr = MatSeqDenseSetLDA(A_RRmA_RV,lda_rhs);CHKERRQ(ierr); 4033ffd830a3SStefano Zampini } 403406656605SStefano Zampini ierr = MatMatMult(A_VR,A_RRmA_RV,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&S_VVt);CHKERRQ(ierr); 403514393ed6SStefano Zampini /* need A_VR * \Phi * A_RRmA_RV = A_VR * (I+L)^T * A_RRmA_RV, L given as before */ 403614393ed6SStefano Zampini if (need_benign_correction) { 4037df4d28bfSStefano Zampini PCBDDCReuseSolvers reuse_solver = sub_schurs->reuse_solver; 403814393ed6SStefano Zampini PetscScalar *marr,*sums; 403914393ed6SStefano Zampini 404014393ed6SStefano Zampini ierr = PetscMalloc1(n_vertices,&sums);CHKERRQ(ierr); 4041f913dca9SStefano Zampini ierr = MatDenseGetArray(S_VVt,&marr);CHKERRQ(ierr); 4042df4d28bfSStefano Zampini for (i=0;i<reuse_solver->benign_n;i++) { 404314393ed6SStefano Zampini const PetscScalar *vals; 404414393ed6SStefano Zampini const PetscInt *idxs,*idxs_zero; 404514393ed6SStefano Zampini PetscInt n,j,nz; 404614393ed6SStefano Zampini 4047df4d28bfSStefano Zampini ierr = ISGetLocalSize(reuse_solver->benign_zerodiag_subs[i],&nz);CHKERRQ(ierr); 4048df4d28bfSStefano Zampini ierr = ISGetIndices(reuse_solver->benign_zerodiag_subs[i],&idxs_zero);CHKERRQ(ierr); 404914393ed6SStefano Zampini for (j=0;j<n_vertices;j++) { 405014393ed6SStefano Zampini PetscInt k; 405114393ed6SStefano Zampini sums[j] = 0.; 405214393ed6SStefano Zampini for (k=0;k<nz;k++) sums[j] += work[idxs_zero[k]+j*lda_rhs]; 405314393ed6SStefano Zampini } 405414393ed6SStefano Zampini ierr = MatGetRow(A_RV_bcorr,i,&n,&idxs,&vals);CHKERRQ(ierr); 405514393ed6SStefano Zampini for (j=0;j<n;j++) { 405614393ed6SStefano Zampini 
PetscScalar val = vals[j]; 405714393ed6SStefano Zampini PetscInt k; 405814393ed6SStefano Zampini for (k=0;k<n_vertices;k++) { 405914393ed6SStefano Zampini marr[idxs[j]+k*n_vertices] += val*sums[k]; 406014393ed6SStefano Zampini } 406114393ed6SStefano Zampini } 406214393ed6SStefano Zampini ierr = MatRestoreRow(A_RV_bcorr,i,&n,&idxs,&vals);CHKERRQ(ierr); 4063df4d28bfSStefano Zampini ierr = ISRestoreIndices(reuse_solver->benign_zerodiag_subs[i],&idxs_zero);CHKERRQ(ierr); 406414393ed6SStefano Zampini } 406514393ed6SStefano Zampini ierr = PetscFree(sums);CHKERRQ(ierr); 4066f913dca9SStefano Zampini ierr = MatDenseRestoreArray(S_VVt,&marr);CHKERRQ(ierr); 406714393ed6SStefano Zampini ierr = MatDestroy(&A_RV_bcorr);CHKERRQ(ierr); 406814393ed6SStefano Zampini } 406980677318SStefano Zampini ierr = MatDestroy(&A_RRmA_RV);CHKERRQ(ierr); 407006656605SStefano Zampini ierr = PetscBLASIntCast(n_vertices*n_vertices,&B_N);CHKERRQ(ierr); 407106656605SStefano Zampini ierr = MatDenseGetArray(A_VV,&x);CHKERRQ(ierr); 407206656605SStefano Zampini ierr = MatDenseGetArray(S_VVt,&y);CHKERRQ(ierr); 407306656605SStefano Zampini PetscStackCallBLAS("BLASaxpy",BLASaxpy_(&B_N,&one,x,&B_one,y,&B_one)); 407406656605SStefano Zampini ierr = MatDenseRestoreArray(A_VV,&x);CHKERRQ(ierr); 407506656605SStefano Zampini ierr = MatDenseRestoreArray(S_VVt,&y);CHKERRQ(ierr); 407606656605SStefano Zampini ierr = MatCopy(S_VVt,S_VV,SAME_NONZERO_PATTERN);CHKERRQ(ierr); 4077d16cbb6bSStefano Zampini ierr = MatDestroy(&S_VVt);CHKERRQ(ierr); 4078019a44ceSStefano Zampini } else { 4079d16cbb6bSStefano Zampini ierr = MatCopy(A_VV,S_VV,SAME_NONZERO_PATTERN);CHKERRQ(ierr); 4080d16cbb6bSStefano Zampini } 408121eccb56SStefano Zampini ierr = MatDestroy(&A_VV);CHKERRQ(ierr); 4082d16cbb6bSStefano Zampini 408306656605SStefano Zampini /* coarse basis functions */ 408406656605SStefano Zampini for (i=0;i<n_vertices;i++) { 408516f15bc4SStefano Zampini PetscScalar *y; 408616f15bc4SStefano Zampini 4087ffd830a3SStefano Zampini ierr = 
VecPlaceArray(pcbddc->vec1_R,work+lda_rhs*i);CHKERRQ(ierr); 408806656605SStefano Zampini ierr = MatDenseGetArray(pcbddc->coarse_phi_B,&y);CHKERRQ(ierr); 408906656605SStefano Zampini ierr = VecPlaceArray(pcis->vec1_B,y+n_B*i);CHKERRQ(ierr); 409006656605SStefano Zampini ierr = VecScatterBegin(pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 409106656605SStefano Zampini ierr = VecScatterEnd(pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 409206656605SStefano Zampini y[n_B*i+idx_V_B[i]] = 1.0; 409306656605SStefano Zampini ierr = MatDenseRestoreArray(pcbddc->coarse_phi_B,&y);CHKERRQ(ierr); 409406656605SStefano Zampini ierr = VecResetArray(pcis->vec1_B);CHKERRQ(ierr); 409506656605SStefano Zampini 409606656605SStefano Zampini if (pcbddc->switch_static || pcbddc->dbg_flag) { 40974f1b2e48SStefano Zampini PetscInt j; 40984f1b2e48SStefano Zampini 409906656605SStefano Zampini ierr = MatDenseGetArray(pcbddc->coarse_phi_D,&y);CHKERRQ(ierr); 410006656605SStefano Zampini ierr = VecPlaceArray(pcis->vec1_D,y+n_D*i);CHKERRQ(ierr); 410106656605SStefano Zampini ierr = VecScatterBegin(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 410206656605SStefano Zampini ierr = VecScatterEnd(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 410306656605SStefano Zampini ierr = VecResetArray(pcis->vec1_D);CHKERRQ(ierr); 41044f1b2e48SStefano Zampini for (j=0;j<pcbddc->benign_n;j++) y[n_D*i+p0_lidx_I[j]] = 0.0; 410506656605SStefano Zampini ierr = MatDenseRestoreArray(pcbddc->coarse_phi_D,&y);CHKERRQ(ierr); 410606656605SStefano Zampini } 410706656605SStefano Zampini ierr = VecResetArray(pcbddc->vec1_R);CHKERRQ(ierr); 410806656605SStefano Zampini } 410904708bb6SStefano Zampini /* if n_R == 0 the object is not destroyed */ 411004708bb6SStefano Zampini ierr = MatDestroy(&A_RV);CHKERRQ(ierr); 411106656605SStefano Zampini } 41125cbda25cSStefano 
Zampini ierr = VecDestroy(&dummy_vec);CHKERRQ(ierr); 411306656605SStefano Zampini 411406656605SStefano Zampini if (n_constraints) { 411506656605SStefano Zampini Mat B; 411606656605SStefano Zampini 4117ffd830a3SStefano Zampini ierr = MatCreateSeqDense(PETSC_COMM_SELF,lda_rhs,n_constraints,work,&B);CHKERRQ(ierr); 411806656605SStefano Zampini ierr = MatScale(S_CC,m_one);CHKERRQ(ierr); 411980677318SStefano Zampini ierr = MatMatMult(local_auxmat2_R,S_CC,MAT_REUSE_MATRIX,PETSC_DEFAULT,&B);CHKERRQ(ierr); 412006656605SStefano Zampini ierr = MatScale(S_CC,m_one);CHKERRQ(ierr); 412106656605SStefano Zampini if (n_vertices) { 412280677318SStefano Zampini if (isCHOL) { /* if we can solve the interior problem with cholesky, we should also be fine with transposing here */ 412380677318SStefano Zampini ierr = MatTranspose(S_CV,MAT_REUSE_MATRIX,&S_VC);CHKERRQ(ierr); 412480677318SStefano Zampini } else { 412580677318SStefano Zampini Mat S_VCt; 412680677318SStefano Zampini 4127ffd830a3SStefano Zampini if (lda_rhs != n_R) { 4128ffd830a3SStefano Zampini ierr = MatDestroy(&B);CHKERRQ(ierr); 412972b8c272SStefano Zampini ierr = MatCreateSeqDense(PETSC_COMM_SELF,n_R,n_constraints,work,&B);CHKERRQ(ierr); 4130ffd830a3SStefano Zampini ierr = MatSeqDenseSetLDA(B,lda_rhs);CHKERRQ(ierr); 4131ffd830a3SStefano Zampini } 413280677318SStefano Zampini ierr = MatMatMult(A_VR,B,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&S_VCt);CHKERRQ(ierr); 413380677318SStefano Zampini ierr = MatCopy(S_VCt,S_VC,SAME_NONZERO_PATTERN);CHKERRQ(ierr); 413480677318SStefano Zampini ierr = MatDestroy(&S_VCt);CHKERRQ(ierr); 413580677318SStefano Zampini } 413606656605SStefano Zampini } 413706656605SStefano Zampini ierr = MatDestroy(&B);CHKERRQ(ierr); 413806656605SStefano Zampini /* coarse basis functions */ 413906656605SStefano Zampini for (i=0;i<n_constraints;i++) { 414006656605SStefano Zampini PetscScalar *y; 414106656605SStefano Zampini 4142ffd830a3SStefano Zampini ierr = VecPlaceArray(pcbddc->vec1_R,work+lda_rhs*i);CHKERRQ(ierr); 
414306656605SStefano Zampini ierr = MatDenseGetArray(pcbddc->coarse_phi_B,&y);CHKERRQ(ierr); 414406656605SStefano Zampini ierr = VecPlaceArray(pcis->vec1_B,y+n_B*(i+n_vertices));CHKERRQ(ierr); 414506656605SStefano Zampini ierr = VecScatterBegin(pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 414606656605SStefano Zampini ierr = VecScatterEnd(pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 414706656605SStefano Zampini ierr = MatDenseRestoreArray(pcbddc->coarse_phi_B,&y);CHKERRQ(ierr); 414806656605SStefano Zampini ierr = VecResetArray(pcis->vec1_B);CHKERRQ(ierr); 414906656605SStefano Zampini if (pcbddc->switch_static || pcbddc->dbg_flag) { 41504f1b2e48SStefano Zampini PetscInt j; 41514f1b2e48SStefano Zampini 415206656605SStefano Zampini ierr = MatDenseGetArray(pcbddc->coarse_phi_D,&y);CHKERRQ(ierr); 415306656605SStefano Zampini ierr = VecPlaceArray(pcis->vec1_D,y+n_D*(i+n_vertices));CHKERRQ(ierr); 415406656605SStefano Zampini ierr = VecScatterBegin(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 415506656605SStefano Zampini ierr = VecScatterEnd(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 415606656605SStefano Zampini ierr = VecResetArray(pcis->vec1_D);CHKERRQ(ierr); 41574f1b2e48SStefano Zampini for (j=0;j<pcbddc->benign_n;j++) y[n_D*i+p0_lidx_I[j]] = 0.0; 415806656605SStefano Zampini ierr = MatDenseRestoreArray(pcbddc->coarse_phi_D,&y);CHKERRQ(ierr); 415906656605SStefano Zampini } 416006656605SStefano Zampini ierr = VecResetArray(pcbddc->vec1_R);CHKERRQ(ierr); 416106656605SStefano Zampini } 416206656605SStefano Zampini } 416380677318SStefano Zampini if (n_constraints) { 416480677318SStefano Zampini ierr = MatDestroy(&local_auxmat2_R);CHKERRQ(ierr); 416580677318SStefano Zampini } 41664f1b2e48SStefano Zampini ierr = PetscFree(p0_lidx_I);CHKERRQ(ierr); 416772b8c272SStefano Zampini 416872b8c272SStefano 
Zampini /* coarse matrix entries relative to B_0 */ 416972b8c272SStefano Zampini if (pcbddc->benign_n) { 417072b8c272SStefano Zampini Mat B0_B,B0_BPHI; 417172b8c272SStefano Zampini IS is_dummy; 417272b8c272SStefano Zampini PetscScalar *data; 417372b8c272SStefano Zampini PetscInt j; 417472b8c272SStefano Zampini 417572b8c272SStefano Zampini ierr = ISCreateStride(PETSC_COMM_SELF,pcbddc->benign_n,0,1,&is_dummy);CHKERRQ(ierr); 41767dae84e0SHong Zhang ierr = MatCreateSubMatrix(pcbddc->benign_B0,is_dummy,pcis->is_B_local,MAT_INITIAL_MATRIX,&B0_B);CHKERRQ(ierr); 417772b8c272SStefano Zampini ierr = ISDestroy(&is_dummy);CHKERRQ(ierr); 417872b8c272SStefano Zampini ierr = MatMatMult(B0_B,pcbddc->coarse_phi_B,MAT_INITIAL_MATRIX,1.0,&B0_BPHI);CHKERRQ(ierr); 417986c38910SStefano Zampini ierr = MatConvert(B0_BPHI,MATSEQDENSE,MAT_INPLACE_MATRIX,&B0_BPHI);CHKERRQ(ierr); 418072b8c272SStefano Zampini ierr = MatDenseGetArray(B0_BPHI,&data);CHKERRQ(ierr); 418172b8c272SStefano Zampini for (j=0;j<pcbddc->benign_n;j++) { 418272b8c272SStefano Zampini PetscInt primal_idx = pcbddc->local_primal_size - pcbddc->benign_n + j; 418372b8c272SStefano Zampini for (i=0;i<pcbddc->local_primal_size;i++) { 418472b8c272SStefano Zampini coarse_submat_vals[primal_idx*pcbddc->local_primal_size+i] = data[i*pcbddc->benign_n+j]; 418572b8c272SStefano Zampini coarse_submat_vals[i*pcbddc->local_primal_size+primal_idx] = data[i*pcbddc->benign_n+j]; 418672b8c272SStefano Zampini } 418772b8c272SStefano Zampini } 418872b8c272SStefano Zampini ierr = MatDenseRestoreArray(B0_BPHI,&data);CHKERRQ(ierr); 418972b8c272SStefano Zampini ierr = MatDestroy(&B0_B);CHKERRQ(ierr); 419072b8c272SStefano Zampini ierr = MatDestroy(&B0_BPHI);CHKERRQ(ierr); 419172b8c272SStefano Zampini } 4192019a44ceSStefano Zampini 419306656605SStefano Zampini /* compute other basis functions for non-symmetric problems */ 41943301b35fSStefano Zampini if (!pcbddc->symmetric_primal) { 4195ffd830a3SStefano Zampini Mat B_V=NULL,B_C=NULL; 4196ffd830a3SStefano 
Zampini PetscScalar *marray; 419706656605SStefano Zampini 419806656605SStefano Zampini if (n_constraints) { 4199ffd830a3SStefano Zampini Mat S_CCT,C_CRT; 420006656605SStefano Zampini 4201abc8f43dSstefano_zampini ierr = MatTranspose(C_CR,MAT_INITIAL_MATRIX,&C_CRT);CHKERRQ(ierr); 420206656605SStefano Zampini ierr = MatTranspose(S_CC,MAT_INITIAL_MATRIX,&S_CCT);CHKERRQ(ierr); 4203ffd830a3SStefano Zampini ierr = MatMatMult(C_CRT,S_CCT,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&B_C);CHKERRQ(ierr); 420416f15bc4SStefano Zampini ierr = MatDestroy(&S_CCT);CHKERRQ(ierr); 420506656605SStefano Zampini if (n_vertices) { 4206ffd830a3SStefano Zampini Mat S_VCT; 420706656605SStefano Zampini 420806656605SStefano Zampini ierr = MatTranspose(S_VC,MAT_INITIAL_MATRIX,&S_VCT);CHKERRQ(ierr); 4209ffd830a3SStefano Zampini ierr = MatMatMult(C_CRT,S_VCT,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&B_V);CHKERRQ(ierr); 421016f15bc4SStefano Zampini ierr = MatDestroy(&S_VCT);CHKERRQ(ierr); 421106656605SStefano Zampini } 4212ffd830a3SStefano Zampini ierr = MatDestroy(&C_CRT);CHKERRQ(ierr); 42135b782168SStefano Zampini } else { 42145b782168SStefano Zampini ierr = MatCreateSeqDense(PETSC_COMM_SELF,n_R,n_vertices,NULL,&B_V);CHKERRQ(ierr); 421506656605SStefano Zampini } 421616f15bc4SStefano Zampini if (n_vertices && n_R) { 4217ffd830a3SStefano Zampini PetscScalar *av,*marray; 4218ffd830a3SStefano Zampini const PetscInt *xadj,*adjncy; 4219ffd830a3SStefano Zampini PetscInt n; 4220ffd830a3SStefano Zampini PetscBool flg_row; 422106656605SStefano Zampini 4222ffd830a3SStefano Zampini /* B_V = B_V - A_VR^T */ 4223af25d912SStefano Zampini ierr = MatConvert(A_VR,MATSEQAIJ,MAT_INPLACE_MATRIX,&A_VR);CHKERRQ(ierr); 4224ffd830a3SStefano Zampini ierr = MatGetRowIJ(A_VR,0,PETSC_FALSE,PETSC_FALSE,&n,&xadj,&adjncy,&flg_row);CHKERRQ(ierr); 4225ffd830a3SStefano Zampini ierr = MatSeqAIJGetArray(A_VR,&av);CHKERRQ(ierr); 4226ffd830a3SStefano Zampini ierr = MatDenseGetArray(B_V,&marray);CHKERRQ(ierr); 4227ffd830a3SStefano Zampini for 
(i=0;i<n;i++) { 4228ffd830a3SStefano Zampini PetscInt j; 4229ffd830a3SStefano Zampini for (j=xadj[i];j<xadj[i+1];j++) marray[i*n_R + adjncy[j]] -= av[j]; 4230ffd830a3SStefano Zampini } 4231ffd830a3SStefano Zampini ierr = MatDenseRestoreArray(B_V,&marray);CHKERRQ(ierr); 4232ffd830a3SStefano Zampini ierr = MatRestoreRowIJ(A_VR,0,PETSC_FALSE,PETSC_FALSE,&n,&xadj,&adjncy,&flg_row);CHKERRQ(ierr); 4233ffd830a3SStefano Zampini ierr = MatDestroy(&A_VR);CHKERRQ(ierr); 423406656605SStefano Zampini } 423506656605SStefano Zampini 4236ffd830a3SStefano Zampini /* currently there's no support for MatTransposeMatSolve(F,B,X) */ 4237abc8f43dSstefano_zampini if (n_vertices) { 4238ffd830a3SStefano Zampini ierr = MatDenseGetArray(B_V,&marray);CHKERRQ(ierr); 4239ffd830a3SStefano Zampini for (i=0;i<n_vertices;i++) { 4240ffd830a3SStefano Zampini ierr = VecPlaceArray(pcbddc->vec1_R,marray+i*n_R);CHKERRQ(ierr); 4241ffd830a3SStefano Zampini ierr = VecPlaceArray(pcbddc->vec2_R,work+i*n_R);CHKERRQ(ierr); 424206656605SStefano Zampini ierr = KSPSolveTranspose(pcbddc->ksp_R,pcbddc->vec1_R,pcbddc->vec2_R);CHKERRQ(ierr); 424306656605SStefano Zampini ierr = VecResetArray(pcbddc->vec1_R);CHKERRQ(ierr); 424406656605SStefano Zampini ierr = VecResetArray(pcbddc->vec2_R);CHKERRQ(ierr); 424506656605SStefano Zampini } 4246ffd830a3SStefano Zampini ierr = MatDenseRestoreArray(B_V,&marray);CHKERRQ(ierr); 4247abc8f43dSstefano_zampini } 42485b782168SStefano Zampini if (B_C) { 4249ffd830a3SStefano Zampini ierr = MatDenseGetArray(B_C,&marray);CHKERRQ(ierr); 4250ffd830a3SStefano Zampini for (i=n_vertices;i<n_constraints+n_vertices;i++) { 4251ffd830a3SStefano Zampini ierr = VecPlaceArray(pcbddc->vec1_R,marray+(i-n_vertices)*n_R);CHKERRQ(ierr); 4252ffd830a3SStefano Zampini ierr = VecPlaceArray(pcbddc->vec2_R,work+i*n_R);CHKERRQ(ierr); 4253ffd830a3SStefano Zampini ierr = KSPSolveTranspose(pcbddc->ksp_R,pcbddc->vec1_R,pcbddc->vec2_R);CHKERRQ(ierr); 4254ffd830a3SStefano Zampini ierr = 
VecResetArray(pcbddc->vec1_R);CHKERRQ(ierr); 4255ffd830a3SStefano Zampini ierr = VecResetArray(pcbddc->vec2_R);CHKERRQ(ierr); 425606656605SStefano Zampini } 4257ffd830a3SStefano Zampini ierr = MatDenseRestoreArray(B_C,&marray);CHKERRQ(ierr); 42585b782168SStefano Zampini } 425906656605SStefano Zampini /* coarse basis functions */ 426006656605SStefano Zampini for (i=0;i<pcbddc->local_primal_size;i++) { 426106656605SStefano Zampini PetscScalar *y; 426206656605SStefano Zampini 4263ffd830a3SStefano Zampini ierr = VecPlaceArray(pcbddc->vec1_R,work+i*n_R);CHKERRQ(ierr); 426406656605SStefano Zampini ierr = MatDenseGetArray(pcbddc->coarse_psi_B,&y);CHKERRQ(ierr); 426506656605SStefano Zampini ierr = VecPlaceArray(pcis->vec1_B,y+n_B*i);CHKERRQ(ierr); 426606656605SStefano Zampini ierr = VecScatterBegin(pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 426706656605SStefano Zampini ierr = VecScatterEnd(pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 426806656605SStefano Zampini if (i<n_vertices) { 426906656605SStefano Zampini y[n_B*i+idx_V_B[i]] = 1.0; 427006656605SStefano Zampini } 427106656605SStefano Zampini ierr = MatDenseRestoreArray(pcbddc->coarse_psi_B,&y);CHKERRQ(ierr); 427206656605SStefano Zampini ierr = VecResetArray(pcis->vec1_B);CHKERRQ(ierr); 427306656605SStefano Zampini 427406656605SStefano Zampini if (pcbddc->switch_static || pcbddc->dbg_flag) { 427506656605SStefano Zampini ierr = MatDenseGetArray(pcbddc->coarse_psi_D,&y);CHKERRQ(ierr); 427606656605SStefano Zampini ierr = VecPlaceArray(pcis->vec1_D,y+n_D*i);CHKERRQ(ierr); 427706656605SStefano Zampini ierr = VecScatterBegin(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 427806656605SStefano Zampini ierr = VecScatterEnd(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 427906656605SStefano Zampini ierr = VecResetArray(pcis->vec1_D);CHKERRQ(ierr); 
428006656605SStefano Zampini ierr = MatDenseRestoreArray(pcbddc->coarse_psi_D,&y);CHKERRQ(ierr); 428106656605SStefano Zampini } 428206656605SStefano Zampini ierr = VecResetArray(pcbddc->vec1_R);CHKERRQ(ierr); 428306656605SStefano Zampini } 4284ffd830a3SStefano Zampini ierr = MatDestroy(&B_V);CHKERRQ(ierr); 4285ffd830a3SStefano Zampini ierr = MatDestroy(&B_C);CHKERRQ(ierr); 428606656605SStefano Zampini } 4287a6e023c1Sstefano_zampini 4288d62866d3SStefano Zampini /* free memory */ 428988ebb749SStefano Zampini ierr = PetscFree(idx_V_B);CHKERRQ(ierr); 429006656605SStefano Zampini ierr = MatDestroy(&S_VV);CHKERRQ(ierr); 429106656605SStefano Zampini ierr = MatDestroy(&S_CV);CHKERRQ(ierr); 429206656605SStefano Zampini ierr = MatDestroy(&S_VC);CHKERRQ(ierr); 429306656605SStefano Zampini ierr = MatDestroy(&S_CC);CHKERRQ(ierr); 4294d62866d3SStefano Zampini ierr = PetscFree(work);CHKERRQ(ierr); 4295d62866d3SStefano Zampini if (n_vertices) { 4296d62866d3SStefano Zampini ierr = MatDestroy(&A_VR);CHKERRQ(ierr); 4297d62866d3SStefano Zampini } 4298d62866d3SStefano Zampini if (n_constraints) { 4299d62866d3SStefano Zampini ierr = MatDestroy(&C_CR);CHKERRQ(ierr); 4300d62866d3SStefano Zampini } 430188ebb749SStefano Zampini /* Checking coarse_sub_mat and coarse basis functios */ 430288ebb749SStefano Zampini /* Symmetric case : It should be \Phi^{(j)^T} A^{(j)} \Phi^{(j)}=coarse_sub_mat */ 430388ebb749SStefano Zampini /* Non-symmetric case : It should be \Psi^{(j)^T} A^{(j)} \Phi^{(j)}=coarse_sub_mat */ 4304d12edf2fSStefano Zampini if (pcbddc->dbg_flag) { 430588ebb749SStefano Zampini Mat coarse_sub_mat; 430625084f0cSStefano Zampini Mat AUXMAT,TM1,TM2,TM3,TM4; 430788ebb749SStefano Zampini Mat coarse_phi_D,coarse_phi_B; 430888ebb749SStefano Zampini Mat coarse_psi_D,coarse_psi_B; 430988ebb749SStefano Zampini Mat A_II,A_BB,A_IB,A_BI; 43108bec7fa6SStefano Zampini Mat C_B,CPHI; 43118bec7fa6SStefano Zampini IS is_dummy; 43128bec7fa6SStefano Zampini Vec mones; 431388ebb749SStefano Zampini 
MatType checkmattype=MATSEQAIJ; 431488ebb749SStefano Zampini PetscReal real_value; 431588ebb749SStefano Zampini 4316a3df083aSStefano Zampini if (pcbddc->benign_n && !pcbddc->benign_change_explicit) { 4317a3df083aSStefano Zampini Mat A; 4318a3df083aSStefano Zampini ierr = PCBDDCBenignProject(pc,NULL,NULL,&A);CHKERRQ(ierr); 43197dae84e0SHong Zhang ierr = MatCreateSubMatrix(A,pcis->is_I_local,pcis->is_I_local,MAT_INITIAL_MATRIX,&A_II);CHKERRQ(ierr); 43207dae84e0SHong Zhang ierr = MatCreateSubMatrix(A,pcis->is_I_local,pcis->is_B_local,MAT_INITIAL_MATRIX,&A_IB);CHKERRQ(ierr); 43217dae84e0SHong Zhang ierr = MatCreateSubMatrix(A,pcis->is_B_local,pcis->is_I_local,MAT_INITIAL_MATRIX,&A_BI);CHKERRQ(ierr); 43227dae84e0SHong Zhang ierr = MatCreateSubMatrix(A,pcis->is_B_local,pcis->is_B_local,MAT_INITIAL_MATRIX,&A_BB);CHKERRQ(ierr); 4323a3df083aSStefano Zampini ierr = MatDestroy(&A);CHKERRQ(ierr); 4324a3df083aSStefano Zampini } else { 432588ebb749SStefano Zampini ierr = MatConvert(pcis->A_II,checkmattype,MAT_INITIAL_MATRIX,&A_II);CHKERRQ(ierr); 432688ebb749SStefano Zampini ierr = MatConvert(pcis->A_IB,checkmattype,MAT_INITIAL_MATRIX,&A_IB);CHKERRQ(ierr); 432788ebb749SStefano Zampini ierr = MatConvert(pcis->A_BI,checkmattype,MAT_INITIAL_MATRIX,&A_BI);CHKERRQ(ierr); 432888ebb749SStefano Zampini ierr = MatConvert(pcis->A_BB,checkmattype,MAT_INITIAL_MATRIX,&A_BB);CHKERRQ(ierr); 4329a3df083aSStefano Zampini } 433088ebb749SStefano Zampini ierr = MatConvert(pcbddc->coarse_phi_D,checkmattype,MAT_INITIAL_MATRIX,&coarse_phi_D);CHKERRQ(ierr); 433188ebb749SStefano Zampini ierr = MatConvert(pcbddc->coarse_phi_B,checkmattype,MAT_INITIAL_MATRIX,&coarse_phi_B);CHKERRQ(ierr); 4332ffd830a3SStefano Zampini if (!pcbddc->symmetric_primal) { 433388ebb749SStefano Zampini ierr = MatConvert(pcbddc->coarse_psi_D,checkmattype,MAT_INITIAL_MATRIX,&coarse_psi_D);CHKERRQ(ierr); 433488ebb749SStefano Zampini ierr = MatConvert(pcbddc->coarse_psi_B,checkmattype,MAT_INITIAL_MATRIX,&coarse_psi_B);CHKERRQ(ierr); 
433588ebb749SStefano Zampini } 433688ebb749SStefano Zampini ierr = MatCreateSeqDense(PETSC_COMM_SELF,pcbddc->local_primal_size,pcbddc->local_primal_size,coarse_submat_vals,&coarse_sub_mat);CHKERRQ(ierr); 433788ebb749SStefano Zampini 433825084f0cSStefano Zampini ierr = PetscViewerASCIIPrintf(pcbddc->dbg_viewer,"--------------------------------------------------\n");CHKERRQ(ierr); 43393301b35fSStefano Zampini ierr = PetscViewerASCIIPrintf(pcbddc->dbg_viewer,"Check coarse sub mat computation (symmetric %d)\n",pcbddc->symmetric_primal);CHKERRQ(ierr); 434025084f0cSStefano Zampini ierr = PetscViewerFlush(pcbddc->dbg_viewer);CHKERRQ(ierr); 4341ffd830a3SStefano Zampini if (!pcbddc->symmetric_primal) { 434288ebb749SStefano Zampini ierr = MatMatMult(A_II,coarse_phi_D,MAT_INITIAL_MATRIX,1.0,&AUXMAT);CHKERRQ(ierr); 434388ebb749SStefano Zampini ierr = MatTransposeMatMult(coarse_psi_D,AUXMAT,MAT_INITIAL_MATRIX,1.0,&TM1);CHKERRQ(ierr); 434488ebb749SStefano Zampini ierr = MatDestroy(&AUXMAT);CHKERRQ(ierr); 434588ebb749SStefano Zampini ierr = MatMatMult(A_BB,coarse_phi_B,MAT_INITIAL_MATRIX,1.0,&AUXMAT);CHKERRQ(ierr); 434688ebb749SStefano Zampini ierr = MatTransposeMatMult(coarse_psi_B,AUXMAT,MAT_INITIAL_MATRIX,1.0,&TM2);CHKERRQ(ierr); 434788ebb749SStefano Zampini ierr = MatDestroy(&AUXMAT);CHKERRQ(ierr); 434888ebb749SStefano Zampini ierr = MatMatMult(A_IB,coarse_phi_B,MAT_INITIAL_MATRIX,1.0,&AUXMAT);CHKERRQ(ierr); 434988ebb749SStefano Zampini ierr = MatTransposeMatMult(coarse_psi_D,AUXMAT,MAT_INITIAL_MATRIX,1.0,&TM3);CHKERRQ(ierr); 435088ebb749SStefano Zampini ierr = MatDestroy(&AUXMAT);CHKERRQ(ierr); 435188ebb749SStefano Zampini ierr = MatMatMult(A_BI,coarse_phi_D,MAT_INITIAL_MATRIX,1.0,&AUXMAT);CHKERRQ(ierr); 435288ebb749SStefano Zampini ierr = MatTransposeMatMult(coarse_psi_B,AUXMAT,MAT_INITIAL_MATRIX,1.0,&TM4);CHKERRQ(ierr); 435388ebb749SStefano Zampini ierr = MatDestroy(&AUXMAT);CHKERRQ(ierr); 435488ebb749SStefano Zampini } else { 435588ebb749SStefano Zampini ierr = 
MatPtAP(A_II,coarse_phi_D,MAT_INITIAL_MATRIX,1.0,&TM1);CHKERRQ(ierr); 435688ebb749SStefano Zampini ierr = MatPtAP(A_BB,coarse_phi_B,MAT_INITIAL_MATRIX,1.0,&TM2);CHKERRQ(ierr); 435788ebb749SStefano Zampini ierr = MatMatMult(A_IB,coarse_phi_B,MAT_INITIAL_MATRIX,1.0,&AUXMAT);CHKERRQ(ierr); 435888ebb749SStefano Zampini ierr = MatTransposeMatMult(coarse_phi_D,AUXMAT,MAT_INITIAL_MATRIX,1.0,&TM3);CHKERRQ(ierr); 435988ebb749SStefano Zampini ierr = MatDestroy(&AUXMAT);CHKERRQ(ierr); 436088ebb749SStefano Zampini ierr = MatMatMult(A_BI,coarse_phi_D,MAT_INITIAL_MATRIX,1.0,&AUXMAT);CHKERRQ(ierr); 436188ebb749SStefano Zampini ierr = MatTransposeMatMult(coarse_phi_B,AUXMAT,MAT_INITIAL_MATRIX,1.0,&TM4);CHKERRQ(ierr); 436288ebb749SStefano Zampini ierr = MatDestroy(&AUXMAT);CHKERRQ(ierr); 436388ebb749SStefano Zampini } 436488ebb749SStefano Zampini ierr = MatAXPY(TM1,one,TM2,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr); 436588ebb749SStefano Zampini ierr = MatAXPY(TM1,one,TM3,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr); 436688ebb749SStefano Zampini ierr = MatAXPY(TM1,one,TM4,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr); 4367511c6705SHong Zhang ierr = MatConvert(TM1,MATSEQDENSE,MAT_INPLACE_MATRIX,&TM1);CHKERRQ(ierr); 43684f1b2e48SStefano Zampini if (pcbddc->benign_n) { 4369fc227af8SStefano Zampini Mat B0_B,B0_BPHI; 4370d12edf2fSStefano Zampini PetscScalar *data,*data2; 43714f1b2e48SStefano Zampini PetscInt j; 4372d12edf2fSStefano Zampini 43734f1b2e48SStefano Zampini ierr = ISCreateStride(PETSC_COMM_SELF,pcbddc->benign_n,0,1,&is_dummy);CHKERRQ(ierr); 43747dae84e0SHong Zhang ierr = MatCreateSubMatrix(pcbddc->benign_B0,is_dummy,pcis->is_B_local,MAT_INITIAL_MATRIX,&B0_B);CHKERRQ(ierr); 4375d12edf2fSStefano Zampini ierr = MatMatMult(B0_B,coarse_phi_B,MAT_INITIAL_MATRIX,1.0,&B0_BPHI);CHKERRQ(ierr); 437686c38910SStefano Zampini ierr = MatConvert(B0_BPHI,MATSEQDENSE,MAT_INPLACE_MATRIX,&B0_BPHI);CHKERRQ(ierr); 4377d12edf2fSStefano Zampini ierr = MatDenseGetArray(TM1,&data);CHKERRQ(ierr); 
4378d12edf2fSStefano Zampini ierr = MatDenseGetArray(B0_BPHI,&data2);CHKERRQ(ierr); 43794f1b2e48SStefano Zampini for (j=0;j<pcbddc->benign_n;j++) { 43804f1b2e48SStefano Zampini PetscInt primal_idx = pcbddc->local_primal_size - pcbddc->benign_n + j; 4381d12edf2fSStefano Zampini for (i=0;i<pcbddc->local_primal_size;i++) { 43824f1b2e48SStefano Zampini data[primal_idx*pcbddc->local_primal_size+i] += data2[i*pcbddc->benign_n+j]; 43834f1b2e48SStefano Zampini data[i*pcbddc->local_primal_size+primal_idx] += data2[i*pcbddc->benign_n+j]; 43844f1b2e48SStefano Zampini } 4385d12edf2fSStefano Zampini } 4386d12edf2fSStefano Zampini ierr = MatDenseRestoreArray(TM1,&data);CHKERRQ(ierr); 4387d12edf2fSStefano Zampini ierr = MatDenseRestoreArray(B0_BPHI,&data2);CHKERRQ(ierr); 4388d12edf2fSStefano Zampini ierr = MatDestroy(&B0_B);CHKERRQ(ierr); 4389d12edf2fSStefano Zampini ierr = ISDestroy(&is_dummy);CHKERRQ(ierr); 4390d12edf2fSStefano Zampini ierr = MatDestroy(&B0_BPHI);CHKERRQ(ierr); 4391d12edf2fSStefano Zampini } 4392d12edf2fSStefano Zampini #if 0 4393d12edf2fSStefano Zampini { 4394d12edf2fSStefano Zampini PetscViewer viewer; 4395d12edf2fSStefano Zampini char filename[256]; 4396ffd830a3SStefano Zampini sprintf(filename,"details_local_coarse_mat%d_level%d.m",PetscGlobalRank,pcbddc->current_level); 4397d12edf2fSStefano Zampini ierr = PetscViewerASCIIOpen(PETSC_COMM_SELF,filename,&viewer);CHKERRQ(ierr); 4398d12edf2fSStefano Zampini ierr = PetscViewerSetFormat(viewer,PETSC_VIEWER_ASCII_MATLAB);CHKERRQ(ierr); 4399ffd830a3SStefano Zampini ierr = PetscObjectSetName((PetscObject)coarse_sub_mat,"computed");CHKERRQ(ierr); 4400ffd830a3SStefano Zampini ierr = MatView(coarse_sub_mat,viewer);CHKERRQ(ierr); 4401ffd830a3SStefano Zampini ierr = PetscObjectSetName((PetscObject)TM1,"projected");CHKERRQ(ierr); 4402d12edf2fSStefano Zampini ierr = MatView(TM1,viewer);CHKERRQ(ierr); 440372b8c272SStefano Zampini if (save_change) { 440472b8c272SStefano Zampini Mat phi_B; 440572b8c272SStefano Zampini ierr = 
MatMatMult(save_change,pcbddc->coarse_phi_B,MAT_INITIAL_MATRIX,1.0,&phi_B);CHKERRQ(ierr); 440672b8c272SStefano Zampini ierr = PetscObjectSetName((PetscObject)phi_B,"phi_B");CHKERRQ(ierr); 440772b8c272SStefano Zampini ierr = MatView(phi_B,viewer);CHKERRQ(ierr); 440872b8c272SStefano Zampini ierr = MatDestroy(&phi_B);CHKERRQ(ierr); 440972b8c272SStefano Zampini } else { 4410ffd830a3SStefano Zampini ierr = PetscObjectSetName((PetscObject)pcbddc->coarse_phi_B,"phi_B");CHKERRQ(ierr); 4411ffd830a3SStefano Zampini ierr = MatView(pcbddc->coarse_phi_B,viewer);CHKERRQ(ierr); 441272b8c272SStefano Zampini } 4413ffd830a3SStefano Zampini if (pcbddc->coarse_phi_D) { 4414ffd830a3SStefano Zampini ierr = PetscObjectSetName((PetscObject)pcbddc->coarse_phi_D,"phi_D");CHKERRQ(ierr); 4415ffd830a3SStefano Zampini ierr = MatView(pcbddc->coarse_phi_D,viewer);CHKERRQ(ierr); 4416ffd830a3SStefano Zampini } 4417ffd830a3SStefano Zampini if (pcbddc->coarse_psi_B) { 4418ffd830a3SStefano Zampini ierr = PetscObjectSetName((PetscObject)pcbddc->coarse_psi_B,"psi_B");CHKERRQ(ierr); 4419ffd830a3SStefano Zampini ierr = MatView(pcbddc->coarse_psi_B,viewer);CHKERRQ(ierr); 4420ffd830a3SStefano Zampini } 442172b8c272SStefano Zampini if (pcbddc->coarse_psi_D) { 4422ffd830a3SStefano Zampini ierr = PetscObjectSetName((PetscObject)pcbddc->coarse_psi_D,"psi_D");CHKERRQ(ierr); 4423ffd830a3SStefano Zampini ierr = MatView(pcbddc->coarse_psi_D,viewer);CHKERRQ(ierr); 4424ffd830a3SStefano Zampini } 4425d12edf2fSStefano Zampini ierr = PetscViewerDestroy(&viewer);CHKERRQ(ierr); 4426d12edf2fSStefano Zampini } 4427d12edf2fSStefano Zampini #endif 442881d9aea3SBarry Smith ierr = MatAXPY(TM1,m_one,coarse_sub_mat,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr); 44298bec7fa6SStefano Zampini ierr = MatNorm(TM1,NORM_FROBENIUS,&real_value);CHKERRQ(ierr); 44301575c14dSBarry Smith ierr = PetscViewerASCIIPushSynchronized(pcbddc->dbg_viewer);CHKERRQ(ierr); 443106656605SStefano Zampini ierr = 
PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"Subdomain %04d matrix error % 1.14e\n",PetscGlobalRank,real_value);CHKERRQ(ierr); 44328bec7fa6SStefano Zampini 44338bec7fa6SStefano Zampini /* check constraints */ 4434a00504b5SStefano Zampini ierr = ISCreateStride(PETSC_COMM_SELF,pcbddc->local_primal_size-pcbddc->benign_n,0,1,&is_dummy);CHKERRQ(ierr); 44357dae84e0SHong Zhang ierr = MatCreateSubMatrix(pcbddc->ConstraintMatrix,is_dummy,pcis->is_B_local,MAT_INITIAL_MATRIX,&C_B);CHKERRQ(ierr); 44364f1b2e48SStefano Zampini if (!pcbddc->benign_n) { /* TODO: add benign case */ 44378bec7fa6SStefano Zampini ierr = MatMatMult(C_B,coarse_phi_B,MAT_INITIAL_MATRIX,1.0,&CPHI);CHKERRQ(ierr); 4438a00504b5SStefano Zampini } else { 4439a00504b5SStefano Zampini PetscScalar *data; 4440a00504b5SStefano Zampini Mat tmat; 4441a00504b5SStefano Zampini ierr = MatDenseGetArray(pcbddc->coarse_phi_B,&data);CHKERRQ(ierr); 4442a00504b5SStefano Zampini ierr = MatCreateSeqDense(PETSC_COMM_SELF,pcis->n_B,pcbddc->local_primal_size-pcbddc->benign_n,data,&tmat);CHKERRQ(ierr); 4443a00504b5SStefano Zampini ierr = MatDenseRestoreArray(pcbddc->coarse_phi_B,&data);CHKERRQ(ierr); 4444a00504b5SStefano Zampini ierr = MatMatMult(C_B,tmat,MAT_INITIAL_MATRIX,1.0,&CPHI);CHKERRQ(ierr); 4445a00504b5SStefano Zampini ierr = MatDestroy(&tmat);CHKERRQ(ierr); 4446a00504b5SStefano Zampini } 44478bec7fa6SStefano Zampini ierr = MatCreateVecs(CPHI,&mones,NULL);CHKERRQ(ierr); 44488bec7fa6SStefano Zampini ierr = VecSet(mones,-1.0);CHKERRQ(ierr); 44498bec7fa6SStefano Zampini ierr = MatDiagonalSet(CPHI,mones,ADD_VALUES);CHKERRQ(ierr); 44508bec7fa6SStefano Zampini ierr = MatNorm(CPHI,NORM_FROBENIUS,&real_value);CHKERRQ(ierr); 4451bdae7319SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"Subdomain %04d phi constraints error % 1.14e\n",PetscGlobalRank,real_value);CHKERRQ(ierr); 4452ffd830a3SStefano Zampini if (!pcbddc->symmetric_primal) { 4453bdae7319SStefano Zampini ierr = 
MatMatMult(C_B,coarse_psi_B,MAT_REUSE_MATRIX,1.0,&CPHI);CHKERRQ(ierr); 4454bdae7319SStefano Zampini ierr = VecSet(mones,-1.0);CHKERRQ(ierr); 4455bdae7319SStefano Zampini ierr = MatDiagonalSet(CPHI,mones,ADD_VALUES);CHKERRQ(ierr); 4456bdae7319SStefano Zampini ierr = MatNorm(CPHI,NORM_FROBENIUS,&real_value);CHKERRQ(ierr); 4457bdae7319SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"Subdomain %04d psi constraints error % 1.14e\n",PetscGlobalRank,real_value);CHKERRQ(ierr); 445888ebb749SStefano Zampini } 44598bec7fa6SStefano Zampini ierr = MatDestroy(&C_B);CHKERRQ(ierr); 44608bec7fa6SStefano Zampini ierr = MatDestroy(&CPHI);CHKERRQ(ierr); 44618bec7fa6SStefano Zampini ierr = ISDestroy(&is_dummy);CHKERRQ(ierr); 44628bec7fa6SStefano Zampini ierr = VecDestroy(&mones);CHKERRQ(ierr); 446325084f0cSStefano Zampini ierr = PetscViewerFlush(pcbddc->dbg_viewer);CHKERRQ(ierr); 446488ebb749SStefano Zampini ierr = MatDestroy(&A_II);CHKERRQ(ierr); 446588ebb749SStefano Zampini ierr = MatDestroy(&A_BB);CHKERRQ(ierr); 446688ebb749SStefano Zampini ierr = MatDestroy(&A_IB);CHKERRQ(ierr); 446788ebb749SStefano Zampini ierr = MatDestroy(&A_BI);CHKERRQ(ierr); 446888ebb749SStefano Zampini ierr = MatDestroy(&TM1);CHKERRQ(ierr); 446988ebb749SStefano Zampini ierr = MatDestroy(&TM2);CHKERRQ(ierr); 447088ebb749SStefano Zampini ierr = MatDestroy(&TM3);CHKERRQ(ierr); 447188ebb749SStefano Zampini ierr = MatDestroy(&TM4);CHKERRQ(ierr); 447288ebb749SStefano Zampini ierr = MatDestroy(&coarse_phi_D);CHKERRQ(ierr); 447388ebb749SStefano Zampini ierr = MatDestroy(&coarse_phi_B);CHKERRQ(ierr); 4474ffd830a3SStefano Zampini if (!pcbddc->symmetric_primal) { 447588ebb749SStefano Zampini ierr = MatDestroy(&coarse_psi_D);CHKERRQ(ierr); 447688ebb749SStefano Zampini ierr = MatDestroy(&coarse_psi_B);CHKERRQ(ierr); 447788ebb749SStefano Zampini } 447888ebb749SStefano Zampini ierr = MatDestroy(&coarse_sub_mat);CHKERRQ(ierr); 447988ebb749SStefano Zampini } 44808629588bSStefano Zampini /* get 
back data */ 44818629588bSStefano Zampini *coarse_submat_vals_n = coarse_submat_vals; 448288ebb749SStefano Zampini PetscFunctionReturn(0); 448388ebb749SStefano Zampini } 448488ebb749SStefano Zampini 44857dae84e0SHong Zhang PetscErrorCode MatCreateSubMatrixUnsorted(Mat A, IS isrow, IS iscol, Mat* B) 4486aa0d41d4SStefano Zampini { 4487d65f70fdSStefano Zampini Mat *work_mat; 4488d65f70fdSStefano Zampini IS isrow_s,iscol_s; 4489d65f70fdSStefano Zampini PetscBool rsorted,csorted; 4490c43ebad9SStefano Zampini PetscInt rsize,*idxs_perm_r=NULL,csize,*idxs_perm_c=NULL; 4491aa0d41d4SStefano Zampini PetscErrorCode ierr; 4492aa0d41d4SStefano Zampini 4493aa0d41d4SStefano Zampini PetscFunctionBegin; 4494d65f70fdSStefano Zampini ierr = ISSorted(isrow,&rsorted);CHKERRQ(ierr); 4495d65f70fdSStefano Zampini ierr = ISSorted(iscol,&csorted);CHKERRQ(ierr); 4496d65f70fdSStefano Zampini ierr = ISGetLocalSize(isrow,&rsize);CHKERRQ(ierr); 4497d65f70fdSStefano Zampini ierr = ISGetLocalSize(iscol,&csize);CHKERRQ(ierr); 4498aa0d41d4SStefano Zampini 4499d65f70fdSStefano Zampini if (!rsorted) { 4500906d46d4SStefano Zampini const PetscInt *idxs; 4501906d46d4SStefano Zampini PetscInt *idxs_sorted,i; 4502aa0d41d4SStefano Zampini 4503d65f70fdSStefano Zampini ierr = PetscMalloc1(rsize,&idxs_perm_r);CHKERRQ(ierr); 4504d65f70fdSStefano Zampini ierr = PetscMalloc1(rsize,&idxs_sorted);CHKERRQ(ierr); 4505d65f70fdSStefano Zampini for (i=0;i<rsize;i++) { 4506d65f70fdSStefano Zampini idxs_perm_r[i] = i; 4507aa0d41d4SStefano Zampini } 4508d65f70fdSStefano Zampini ierr = ISGetIndices(isrow,&idxs);CHKERRQ(ierr); 4509d65f70fdSStefano Zampini ierr = PetscSortIntWithPermutation(rsize,idxs,idxs_perm_r);CHKERRQ(ierr); 4510d65f70fdSStefano Zampini for (i=0;i<rsize;i++) { 4511d65f70fdSStefano Zampini idxs_sorted[i] = idxs[idxs_perm_r[i]]; 4512aa0d41d4SStefano Zampini } 4513d65f70fdSStefano Zampini ierr = ISRestoreIndices(isrow,&idxs);CHKERRQ(ierr); 4514d65f70fdSStefano Zampini ierr = 
ISCreateGeneral(PETSC_COMM_SELF,rsize,idxs_sorted,PETSC_OWN_POINTER,&isrow_s);CHKERRQ(ierr); 4515d65f70fdSStefano Zampini } else { 4516d65f70fdSStefano Zampini ierr = PetscObjectReference((PetscObject)isrow);CHKERRQ(ierr); 4517d65f70fdSStefano Zampini isrow_s = isrow; 4518aa0d41d4SStefano Zampini } 4519906d46d4SStefano Zampini 4520d65f70fdSStefano Zampini if (!csorted) { 4521d65f70fdSStefano Zampini if (isrow == iscol) { 4522d65f70fdSStefano Zampini ierr = PetscObjectReference((PetscObject)isrow_s);CHKERRQ(ierr); 4523d65f70fdSStefano Zampini iscol_s = isrow_s; 4524d65f70fdSStefano Zampini } else { 4525d65f70fdSStefano Zampini const PetscInt *idxs; 4526d65f70fdSStefano Zampini PetscInt *idxs_sorted,i; 4527906d46d4SStefano Zampini 4528d65f70fdSStefano Zampini ierr = PetscMalloc1(csize,&idxs_perm_c);CHKERRQ(ierr); 4529d65f70fdSStefano Zampini ierr = PetscMalloc1(csize,&idxs_sorted);CHKERRQ(ierr); 4530d65f70fdSStefano Zampini for (i=0;i<csize;i++) { 4531d65f70fdSStefano Zampini idxs_perm_c[i] = i; 4532d65f70fdSStefano Zampini } 4533d65f70fdSStefano Zampini ierr = ISGetIndices(iscol,&idxs);CHKERRQ(ierr); 4534d65f70fdSStefano Zampini ierr = PetscSortIntWithPermutation(csize,idxs,idxs_perm_c);CHKERRQ(ierr); 4535d65f70fdSStefano Zampini for (i=0;i<csize;i++) { 4536d65f70fdSStefano Zampini idxs_sorted[i] = idxs[idxs_perm_c[i]]; 4537d65f70fdSStefano Zampini } 4538d65f70fdSStefano Zampini ierr = ISRestoreIndices(iscol,&idxs);CHKERRQ(ierr); 4539d65f70fdSStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,csize,idxs_sorted,PETSC_OWN_POINTER,&iscol_s);CHKERRQ(ierr); 4540d65f70fdSStefano Zampini } 4541d65f70fdSStefano Zampini } else { 4542d65f70fdSStefano Zampini ierr = PetscObjectReference((PetscObject)iscol);CHKERRQ(ierr); 4543d65f70fdSStefano Zampini iscol_s = iscol; 4544d65f70fdSStefano Zampini } 4545d65f70fdSStefano Zampini 45467dae84e0SHong Zhang ierr = MatCreateSubMatrices(A,1,&isrow_s,&iscol_s,MAT_INITIAL_MATRIX,&work_mat);CHKERRQ(ierr); 4547d65f70fdSStefano Zampini 
4548d65f70fdSStefano Zampini if (!rsorted || !csorted) { 4549906d46d4SStefano Zampini Mat new_mat; 4550d65f70fdSStefano Zampini IS is_perm_r,is_perm_c; 4551906d46d4SStefano Zampini 4552d65f70fdSStefano Zampini if (!rsorted) { 4553d65f70fdSStefano Zampini PetscInt *idxs_r,i; 4554d65f70fdSStefano Zampini ierr = PetscMalloc1(rsize,&idxs_r);CHKERRQ(ierr); 4555d65f70fdSStefano Zampini for (i=0;i<rsize;i++) { 4556d65f70fdSStefano Zampini idxs_r[idxs_perm_r[i]] = i; 4557906d46d4SStefano Zampini } 4558d65f70fdSStefano Zampini ierr = PetscFree(idxs_perm_r);CHKERRQ(ierr); 4559d65f70fdSStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,rsize,idxs_r,PETSC_OWN_POINTER,&is_perm_r);CHKERRQ(ierr); 4560d65f70fdSStefano Zampini } else { 4561d65f70fdSStefano Zampini ierr = ISCreateStride(PETSC_COMM_SELF,rsize,0,1,&is_perm_r);CHKERRQ(ierr); 4562906d46d4SStefano Zampini } 4563d65f70fdSStefano Zampini ierr = ISSetPermutation(is_perm_r);CHKERRQ(ierr); 4564d65f70fdSStefano Zampini 4565d65f70fdSStefano Zampini if (!csorted) { 4566d65f70fdSStefano Zampini if (isrow_s == iscol_s) { 4567d65f70fdSStefano Zampini ierr = PetscObjectReference((PetscObject)is_perm_r);CHKERRQ(ierr); 4568d65f70fdSStefano Zampini is_perm_c = is_perm_r; 4569d65f70fdSStefano Zampini } else { 4570d65f70fdSStefano Zampini PetscInt *idxs_c,i; 4571f913dca9SStefano Zampini if (!idxs_perm_c) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Permutation array not present"); 4572d65f70fdSStefano Zampini ierr = PetscMalloc1(csize,&idxs_c);CHKERRQ(ierr); 4573d65f70fdSStefano Zampini for (i=0;i<csize;i++) { 4574d65f70fdSStefano Zampini idxs_c[idxs_perm_c[i]] = i; 4575d65f70fdSStefano Zampini } 4576d65f70fdSStefano Zampini ierr = PetscFree(idxs_perm_c);CHKERRQ(ierr); 4577d65f70fdSStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,csize,idxs_c,PETSC_OWN_POINTER,&is_perm_c);CHKERRQ(ierr); 4578d65f70fdSStefano Zampini } 4579d65f70fdSStefano Zampini } else { 4580d65f70fdSStefano Zampini ierr = 
ISCreateStride(PETSC_COMM_SELF,csize,0,1,&is_perm_c);CHKERRQ(ierr); 4581d65f70fdSStefano Zampini } 4582d65f70fdSStefano Zampini ierr = ISSetPermutation(is_perm_c);CHKERRQ(ierr); 4583d65f70fdSStefano Zampini 4584d65f70fdSStefano Zampini ierr = MatPermute(work_mat[0],is_perm_r,is_perm_c,&new_mat);CHKERRQ(ierr); 4585d65f70fdSStefano Zampini ierr = MatDestroy(&work_mat[0]);CHKERRQ(ierr); 4586d65f70fdSStefano Zampini work_mat[0] = new_mat; 4587d65f70fdSStefano Zampini ierr = ISDestroy(&is_perm_r);CHKERRQ(ierr); 4588d65f70fdSStefano Zampini ierr = ISDestroy(&is_perm_c);CHKERRQ(ierr); 4589d65f70fdSStefano Zampini } 4590d65f70fdSStefano Zampini 4591d65f70fdSStefano Zampini ierr = PetscObjectReference((PetscObject)work_mat[0]);CHKERRQ(ierr); 4592d65f70fdSStefano Zampini *B = work_mat[0]; 4593d65f70fdSStefano Zampini ierr = MatDestroyMatrices(1,&work_mat);CHKERRQ(ierr); 4594d65f70fdSStefano Zampini ierr = ISDestroy(&isrow_s);CHKERRQ(ierr); 4595d65f70fdSStefano Zampini ierr = ISDestroy(&iscol_s);CHKERRQ(ierr); 4596d65f70fdSStefano Zampini PetscFunctionReturn(0); 4597d65f70fdSStefano Zampini } 4598d65f70fdSStefano Zampini 45995e8657edSStefano Zampini PetscErrorCode PCBDDCComputeLocalMatrix(PC pc, Mat ChangeOfBasisMatrix) 4600aa0d41d4SStefano Zampini { 4601aa0d41d4SStefano Zampini Mat_IS* matis = (Mat_IS*)pc->pmat->data; 46025e8657edSStefano Zampini PC_BDDC* pcbddc = (PC_BDDC*)pc->data; 4603022d8d2bSstefano_zampini Mat new_mat,lA; 46045e8657edSStefano Zampini IS is_local,is_global; 4605d65f70fdSStefano Zampini PetscInt local_size; 4606d65f70fdSStefano Zampini PetscBool isseqaij; 4607aa0d41d4SStefano Zampini PetscErrorCode ierr; 4608aa0d41d4SStefano Zampini 4609aa0d41d4SStefano Zampini PetscFunctionBegin; 4610aa0d41d4SStefano Zampini ierr = MatDestroy(&pcbddc->local_mat);CHKERRQ(ierr); 46115e8657edSStefano Zampini ierr = MatGetSize(matis->A,&local_size,NULL);CHKERRQ(ierr); 46125e8657edSStefano Zampini ierr = 
ISCreateStride(PetscObjectComm((PetscObject)matis->A),local_size,0,1,&is_local);CHKERRQ(ierr); 4613b087196eSStefano Zampini ierr = ISLocalToGlobalMappingApplyIS(pc->pmat->rmap->mapping,is_local,&is_global);CHKERRQ(ierr); 4614aa0d41d4SStefano Zampini ierr = ISDestroy(&is_local);CHKERRQ(ierr); 46157dae84e0SHong Zhang ierr = MatCreateSubMatrixUnsorted(ChangeOfBasisMatrix,is_global,is_global,&new_mat);CHKERRQ(ierr); 4616aa0d41d4SStefano Zampini ierr = ISDestroy(&is_global);CHKERRQ(ierr); 4617906d46d4SStefano Zampini 4618906d46d4SStefano Zampini /* check */ 4619906d46d4SStefano Zampini if (pcbddc->dbg_flag) { 4620906d46d4SStefano Zampini Vec x,x_change; 4621906d46d4SStefano Zampini PetscReal error; 4622906d46d4SStefano Zampini 46235e8657edSStefano Zampini ierr = MatCreateVecs(ChangeOfBasisMatrix,&x,&x_change);CHKERRQ(ierr); 4624906d46d4SStefano Zampini ierr = VecSetRandom(x,NULL);CHKERRQ(ierr); 46255e8657edSStefano Zampini ierr = MatMult(ChangeOfBasisMatrix,x,x_change);CHKERRQ(ierr); 4626e176bc59SStefano Zampini ierr = VecScatterBegin(matis->cctx,x,matis->x,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 4627e176bc59SStefano Zampini ierr = VecScatterEnd(matis->cctx,x,matis->x,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 4628d65f70fdSStefano Zampini ierr = MatMult(new_mat,matis->x,matis->y);CHKERRQ(ierr); 462988428137SStefano Zampini if (!pcbddc->change_interior) { 463088428137SStefano Zampini const PetscScalar *x,*y,*v; 463188428137SStefano Zampini PetscReal lerror = 0.; 463288428137SStefano Zampini PetscInt i; 463388428137SStefano Zampini 463488428137SStefano Zampini ierr = VecGetArrayRead(matis->x,&x);CHKERRQ(ierr); 463588428137SStefano Zampini ierr = VecGetArrayRead(matis->y,&y);CHKERRQ(ierr); 463688428137SStefano Zampini ierr = VecGetArrayRead(matis->counter,&v);CHKERRQ(ierr); 463788428137SStefano Zampini for (i=0;i<local_size;i++) 463888428137SStefano Zampini if (PetscRealPart(v[i]) < 1.5 && PetscAbsScalar(x[i]-y[i]) > lerror) 463988428137SStefano Zampini lerror = 
PetscAbsScalar(x[i]-y[i]); 464088428137SStefano Zampini ierr = VecRestoreArrayRead(matis->x,&x);CHKERRQ(ierr); 464188428137SStefano Zampini ierr = VecRestoreArrayRead(matis->y,&y);CHKERRQ(ierr); 464288428137SStefano Zampini ierr = VecRestoreArrayRead(matis->counter,&v);CHKERRQ(ierr); 464388428137SStefano Zampini ierr = MPIU_Allreduce(&lerror,&error,1,MPIU_REAL,MPI_MAX,PetscObjectComm((PetscObject)pc));CHKERRQ(ierr); 4644637e8532SStefano Zampini if (error > PETSC_SMALL) { 4645637e8532SStefano Zampini if (!pcbddc->user_ChangeOfBasisMatrix || pcbddc->current_level) { 4646637e8532SStefano Zampini SETERRQ1(PetscObjectComm((PetscObject)pc),PETSC_ERR_PLIB,"Error global vs local change on I: %1.6e\n",error); 4647637e8532SStefano Zampini } else { 4648637e8532SStefano Zampini SETERRQ1(PetscObjectComm((PetscObject)pc),PETSC_ERR_USER,"Error global vs local change on I: %1.6e\n",error); 4649637e8532SStefano Zampini } 4650637e8532SStefano Zampini } 465188428137SStefano Zampini } 4652e176bc59SStefano Zampini ierr = VecScatterBegin(matis->rctx,matis->y,x,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 4653e176bc59SStefano Zampini ierr = VecScatterEnd(matis->rctx,matis->y,x,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 4654906d46d4SStefano Zampini ierr = VecAXPY(x,-1.0,x_change);CHKERRQ(ierr); 4655906d46d4SStefano Zampini ierr = VecNorm(x,NORM_INFINITY,&error);CHKERRQ(ierr); 4656637e8532SStefano Zampini if (error > PETSC_SMALL) { 4657637e8532SStefano Zampini if (!pcbddc->user_ChangeOfBasisMatrix || pcbddc->current_level) { 4658637e8532SStefano Zampini SETERRQ1(PetscObjectComm((PetscObject)pc),PETSC_ERR_PLIB,"Error global vs local change on N: %1.6e\n",error); 4659637e8532SStefano Zampini } else { 4660637e8532SStefano Zampini SETERRQ1(PetscObjectComm((PetscObject)pc),PETSC_ERR_USER,"Error global vs local change on N: %1.6e\n",error); 4661637e8532SStefano Zampini } 4662637e8532SStefano Zampini } 4663906d46d4SStefano Zampini ierr = VecDestroy(&x);CHKERRQ(ierr); 4664906d46d4SStefano 
Zampini ierr = VecDestroy(&x_change);CHKERRQ(ierr); 4665906d46d4SStefano Zampini } 4666906d46d4SStefano Zampini 4667022d8d2bSstefano_zampini /* lA is present if we are setting up an inner BDDC for a saddle point FETI-DP */ 4668022d8d2bSstefano_zampini ierr = PetscObjectQuery((PetscObject)pc,"__KSPFETIDP_lA" ,(PetscObject*)&lA);CHKERRQ(ierr); 4669022d8d2bSstefano_zampini 467022d5777bSStefano Zampini /* TODO: HOW TO WORK WITH BAIJ and SBAIJ and SEQDENSE? */ 46719b28b3ffSStefano Zampini ierr = PetscObjectTypeCompare((PetscObject)matis->A,MATSEQAIJ,&isseqaij);CHKERRQ(ierr); 467222d5777bSStefano Zampini if (isseqaij) { 4673a00504b5SStefano Zampini ierr = MatDestroy(&pcbddc->local_mat);CHKERRQ(ierr); 4674a00504b5SStefano Zampini ierr = MatPtAP(matis->A,new_mat,MAT_INITIAL_MATRIX,2.0,&pcbddc->local_mat);CHKERRQ(ierr); 4675022d8d2bSstefano_zampini if (lA) { 4676022d8d2bSstefano_zampini Mat work; 4677022d8d2bSstefano_zampini ierr = MatPtAP(lA,new_mat,MAT_INITIAL_MATRIX,2.0,&work);CHKERRQ(ierr); 4678022d8d2bSstefano_zampini ierr = PetscObjectCompose((PetscObject)pc,"__KSPFETIDP_lA" ,(PetscObject)work);CHKERRQ(ierr); 4679022d8d2bSstefano_zampini ierr = MatDestroy(&work);CHKERRQ(ierr); 4680022d8d2bSstefano_zampini } 4681aa0d41d4SStefano Zampini } else { 4682a00504b5SStefano Zampini Mat work_mat; 46831cf9b237SStefano Zampini 4684a00504b5SStefano Zampini ierr = MatDestroy(&pcbddc->local_mat);CHKERRQ(ierr); 4685aa0d41d4SStefano Zampini ierr = MatConvert(matis->A,MATSEQAIJ,MAT_INITIAL_MATRIX,&work_mat);CHKERRQ(ierr); 4686a00504b5SStefano Zampini ierr = MatPtAP(work_mat,new_mat,MAT_INITIAL_MATRIX,2.0,&pcbddc->local_mat);CHKERRQ(ierr); 46871d82a3b6SStefano Zampini ierr = MatDestroy(&work_mat);CHKERRQ(ierr); 4688022d8d2bSstefano_zampini if (lA) { 4689022d8d2bSstefano_zampini Mat work; 4690022d8d2bSstefano_zampini ierr = MatConvert(lA,MATSEQAIJ,MAT_INITIAL_MATRIX,&work_mat);CHKERRQ(ierr); 4691022d8d2bSstefano_zampini ierr = 
MatPtAP(work_mat,new_mat,MAT_INITIAL_MATRIX,2.0,&work);CHKERRQ(ierr); 4692022d8d2bSstefano_zampini ierr = PetscObjectCompose((PetscObject)pc,"__KSPFETIDP_lA" ,(PetscObject)work);CHKERRQ(ierr); 4693022d8d2bSstefano_zampini ierr = MatDestroy(&work);CHKERRQ(ierr); 4694022d8d2bSstefano_zampini } 4695aa0d41d4SStefano Zampini } 46963301b35fSStefano Zampini if (matis->A->symmetric_set) { 46973301b35fSStefano Zampini ierr = MatSetOption(pcbddc->local_mat,MAT_SYMMETRIC,matis->A->symmetric);CHKERRQ(ierr); 4698e496cd5dSStefano Zampini #if !defined(PETSC_USE_COMPLEX) 46993301b35fSStefano Zampini ierr = MatSetOption(pcbddc->local_mat,MAT_HERMITIAN,matis->A->symmetric);CHKERRQ(ierr); 4700e496cd5dSStefano Zampini #endif 47013301b35fSStefano Zampini } 4702d65f70fdSStefano Zampini ierr = MatDestroy(&new_mat);CHKERRQ(ierr); 4703aa0d41d4SStefano Zampini PetscFunctionReturn(0); 4704aa0d41d4SStefano Zampini } 4705aa0d41d4SStefano Zampini 47068ce42a96SStefano Zampini PetscErrorCode PCBDDCSetUpLocalScatters(PC pc) 4707a64d13efSStefano Zampini { 4708a64d13efSStefano Zampini PC_IS* pcis = (PC_IS*)(pc->data); 4709a64d13efSStefano Zampini PC_BDDC* pcbddc = (PC_BDDC*)pc->data; 4710d62866d3SStefano Zampini PCBDDCSubSchurs sub_schurs = pcbddc->sub_schurs; 471153892102SStefano Zampini PetscInt *idx_R_local=NULL; 47123a50541eSStefano Zampini PetscInt n_vertices,i,j,n_R,n_D,n_B; 47133a50541eSStefano Zampini PetscInt vbs,bs; 47146816873aSStefano Zampini PetscBT bitmask=NULL; 4715a64d13efSStefano Zampini PetscErrorCode ierr; 4716a64d13efSStefano Zampini 4717a64d13efSStefano Zampini PetscFunctionBegin; 4718b23d619eSStefano Zampini /* 4719b23d619eSStefano Zampini No need to setup local scatters if 4720b23d619eSStefano Zampini - primal space is unchanged 4721b23d619eSStefano Zampini AND 4722b23d619eSStefano Zampini - we actually have locally some primal dofs (could not be true in multilevel or for isolated subdomains) 4723b23d619eSStefano Zampini AND 4724b23d619eSStefano Zampini - we are not in 
debugging mode (this is needed since there are Synchronized prints at the end of the subroutine 4725b23d619eSStefano Zampini */ 4726b23d619eSStefano Zampini if (!pcbddc->new_primal_space_local && pcbddc->local_primal_size && !pcbddc->dbg_flag) { 4727f4ddd8eeSStefano Zampini PetscFunctionReturn(0); 4728f4ddd8eeSStefano Zampini } 4729f4ddd8eeSStefano Zampini /* destroy old objects */ 4730f4ddd8eeSStefano Zampini ierr = ISDestroy(&pcbddc->is_R_local);CHKERRQ(ierr); 4731f4ddd8eeSStefano Zampini ierr = VecScatterDestroy(&pcbddc->R_to_B);CHKERRQ(ierr); 4732f4ddd8eeSStefano Zampini ierr = VecScatterDestroy(&pcbddc->R_to_D);CHKERRQ(ierr); 4733a64d13efSStefano Zampini /* Set Non-overlapping dimensions */ 4734b371cd4fSStefano Zampini n_B = pcis->n_B; 4735b371cd4fSStefano Zampini n_D = pcis->n - n_B; 4736b371cd4fSStefano Zampini n_vertices = pcbddc->n_vertices; 47373a50541eSStefano Zampini 4738a64d13efSStefano Zampini /* Dohrmann's notation: dofs splitted in R (Remaining: all dofs but the vertices) and V (Vertices) */ 47396816873aSStefano Zampini 474053892102SStefano Zampini /* create auxiliary bitmask and allocate workspace */ 4741b334f244SStefano Zampini if (!sub_schurs || !sub_schurs->reuse_solver) { 4742854ce69bSBarry Smith ierr = PetscMalloc1(pcis->n-n_vertices,&idx_R_local);CHKERRQ(ierr); 4743a64d13efSStefano Zampini ierr = PetscBTCreate(pcis->n,&bitmask);CHKERRQ(ierr); 4744a64d13efSStefano Zampini for (i=0;i<n_vertices;i++) { 47450e6343abSStefano Zampini ierr = PetscBTSet(bitmask,pcbddc->local_primal_ref_node[i]);CHKERRQ(ierr); 4746a64d13efSStefano Zampini } 4747a64d13efSStefano Zampini 4748a64d13efSStefano Zampini for (i=0, n_R=0; i<pcis->n; i++) { 47494641a718SStefano Zampini if (!PetscBTLookup(bitmask,i)) { 47506816873aSStefano Zampini idx_R_local[n_R++] = i; 4751a64d13efSStefano Zampini } 4752a64d13efSStefano Zampini } 4753df4d28bfSStefano Zampini } else { /* A different ordering (already computed) is present if we are reusing the Schur solver */ 
4754df4d28bfSStefano Zampini PCBDDCReuseSolvers reuse_solver = sub_schurs->reuse_solver; 47556816873aSStefano Zampini 4756df4d28bfSStefano Zampini ierr = ISGetIndices(reuse_solver->is_R,(const PetscInt**)&idx_R_local);CHKERRQ(ierr); 4757df4d28bfSStefano Zampini ierr = ISGetLocalSize(reuse_solver->is_R,&n_R);CHKERRQ(ierr); 47586816873aSStefano Zampini } 47593a50541eSStefano Zampini 47603a50541eSStefano Zampini /* Block code */ 47613a50541eSStefano Zampini vbs = 1; 47623a50541eSStefano Zampini ierr = MatGetBlockSize(pcbddc->local_mat,&bs);CHKERRQ(ierr); 47633a50541eSStefano Zampini if (bs>1 && !(n_vertices%bs)) { 47643a50541eSStefano Zampini PetscBool is_blocked = PETSC_TRUE; 47653a50541eSStefano Zampini PetscInt *vary; 4766b334f244SStefano Zampini if (!sub_schurs || !sub_schurs->reuse_solver) { 4767785e854fSJed Brown ierr = PetscMalloc1(pcis->n/bs,&vary);CHKERRQ(ierr); 47683a50541eSStefano Zampini ierr = PetscMemzero(vary,pcis->n/bs*sizeof(PetscInt));CHKERRQ(ierr); 4769d3df7717SStefano Zampini /* Verify that the vertex indices correspond to each element in a block (code taken from sbaij2.c) */ 4770d3df7717SStefano Zampini /* it is ok to check this way since local_primal_ref_node are always sorted by local numbering and idx_R_local is obtained as a complement */ 47710e6343abSStefano Zampini for (i=0; i<n_vertices; i++) vary[pcbddc->local_primal_ref_node[i]/bs]++; 4772d3df7717SStefano Zampini for (i=0; i<pcis->n/bs; i++) { 47733a50541eSStefano Zampini if (vary[i]!=0 && vary[i]!=bs) { 47743a50541eSStefano Zampini is_blocked = PETSC_FALSE; 47753a50541eSStefano Zampini break; 47763a50541eSStefano Zampini } 47773a50541eSStefano Zampini } 4778d3df7717SStefano Zampini ierr = PetscFree(vary);CHKERRQ(ierr); 4779d3df7717SStefano Zampini } else { 4780d3df7717SStefano Zampini /* Verify directly the R set */ 4781d3df7717SStefano Zampini for (i=0; i<n_R/bs; i++) { 4782d3df7717SStefano Zampini PetscInt j,node=idx_R_local[bs*i]; 4783d3df7717SStefano Zampini for (j=1; j<bs; j++) { 
4784d3df7717SStefano Zampini if (node != idx_R_local[bs*i+j]-j) { 4785d3df7717SStefano Zampini is_blocked = PETSC_FALSE; 4786d3df7717SStefano Zampini break; 4787d3df7717SStefano Zampini } 4788d3df7717SStefano Zampini } 4789d3df7717SStefano Zampini } 4790d3df7717SStefano Zampini } 47913a50541eSStefano Zampini if (is_blocked) { /* build compressed IS for R nodes (complement of vertices) */ 47923a50541eSStefano Zampini vbs = bs; 47933a50541eSStefano Zampini for (i=0;i<n_R/vbs;i++) { 47943a50541eSStefano Zampini idx_R_local[i] = idx_R_local[vbs*i]/vbs; 47953a50541eSStefano Zampini } 47963a50541eSStefano Zampini } 47973a50541eSStefano Zampini } 47983a50541eSStefano Zampini ierr = ISCreateBlock(PETSC_COMM_SELF,vbs,n_R/vbs,idx_R_local,PETSC_COPY_VALUES,&pcbddc->is_R_local);CHKERRQ(ierr); 4799b334f244SStefano Zampini if (sub_schurs && sub_schurs->reuse_solver) { 4800df4d28bfSStefano Zampini PCBDDCReuseSolvers reuse_solver = sub_schurs->reuse_solver; 480153892102SStefano Zampini 4802df4d28bfSStefano Zampini ierr = ISRestoreIndices(reuse_solver->is_R,(const PetscInt**)&idx_R_local);CHKERRQ(ierr); 4803df4d28bfSStefano Zampini ierr = ISDestroy(&reuse_solver->is_R);CHKERRQ(ierr); 480453892102SStefano Zampini ierr = PetscObjectReference((PetscObject)pcbddc->is_R_local);CHKERRQ(ierr); 4805df4d28bfSStefano Zampini reuse_solver->is_R = pcbddc->is_R_local; 480653892102SStefano Zampini } else { 48073a50541eSStefano Zampini ierr = PetscFree(idx_R_local);CHKERRQ(ierr); 480853892102SStefano Zampini } 4809a64d13efSStefano Zampini 4810a64d13efSStefano Zampini /* print some info if requested */ 4811a64d13efSStefano Zampini if (pcbddc->dbg_flag) { 4812a64d13efSStefano Zampini ierr = PetscViewerASCIIPrintf(pcbddc->dbg_viewer,"--------------------------------------------------\n");CHKERRQ(ierr); 4813a64d13efSStefano Zampini ierr = PetscViewerFlush(pcbddc->dbg_viewer);CHKERRQ(ierr); 48141575c14dSBarry Smith ierr = PetscViewerASCIIPushSynchronized(pcbddc->dbg_viewer);CHKERRQ(ierr); 
4815a64d13efSStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"Subdomain %04d local dimensions\n",PetscGlobalRank);CHKERRQ(ierr); 4816a64d13efSStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"local_size = %d, dirichlet_size = %d, boundary_size = %d\n",pcis->n,n_D,n_B);CHKERRQ(ierr); 48174f1b2e48SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"r_size = %d, v_size = %d, constraints = %d, local_primal_size = %d\n",n_R,n_vertices,pcbddc->local_primal_size-n_vertices-pcbddc->benign_n,pcbddc->local_primal_size);CHKERRQ(ierr); 4818a64d13efSStefano Zampini ierr = PetscViewerFlush(pcbddc->dbg_viewer);CHKERRQ(ierr); 4819a64d13efSStefano Zampini } 4820a64d13efSStefano Zampini 4821a64d13efSStefano Zampini /* VecScatters pcbddc->R_to_B and (optionally) pcbddc->R_to_D */ 4822b334f244SStefano Zampini if (!sub_schurs || !sub_schurs->reuse_solver) { 48236816873aSStefano Zampini IS is_aux1,is_aux2; 48246816873aSStefano Zampini PetscInt *aux_array1,*aux_array2,*is_indices,*idx_R_local; 48256816873aSStefano Zampini 48263a50541eSStefano Zampini ierr = ISGetIndices(pcbddc->is_R_local,(const PetscInt**)&idx_R_local);CHKERRQ(ierr); 4827854ce69bSBarry Smith ierr = PetscMalloc1(pcis->n_B-n_vertices,&aux_array1);CHKERRQ(ierr); 4828854ce69bSBarry Smith ierr = PetscMalloc1(pcis->n_B-n_vertices,&aux_array2);CHKERRQ(ierr); 4829a64d13efSStefano Zampini ierr = ISGetIndices(pcis->is_I_local,(const PetscInt**)&is_indices);CHKERRQ(ierr); 48304641a718SStefano Zampini for (i=0; i<n_D; i++) { 48314641a718SStefano Zampini ierr = PetscBTSet(bitmask,is_indices[i]);CHKERRQ(ierr); 48324641a718SStefano Zampini } 4833a64d13efSStefano Zampini ierr = ISRestoreIndices(pcis->is_I_local,(const PetscInt**)&is_indices);CHKERRQ(ierr); 4834a64d13efSStefano Zampini for (i=0, j=0; i<n_R; i++) { 48354641a718SStefano Zampini if (!PetscBTLookup(bitmask,idx_R_local[i])) { 48364641a718SStefano Zampini aux_array1[j++] = i; 
4837a64d13efSStefano Zampini } 4838a64d13efSStefano Zampini } 4839a64d13efSStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,j,aux_array1,PETSC_OWN_POINTER,&is_aux1);CHKERRQ(ierr); 4840a64d13efSStefano Zampini ierr = ISGetIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr); 4841a64d13efSStefano Zampini for (i=0, j=0; i<n_B; i++) { 48424641a718SStefano Zampini if (!PetscBTLookup(bitmask,is_indices[i])) { 48434641a718SStefano Zampini aux_array2[j++] = i; 4844a64d13efSStefano Zampini } 4845a64d13efSStefano Zampini } 4846a64d13efSStefano Zampini ierr = ISRestoreIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr); 4847a64d13efSStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,j,aux_array2,PETSC_OWN_POINTER,&is_aux2);CHKERRQ(ierr); 4848a64d13efSStefano Zampini ierr = VecScatterCreate(pcbddc->vec1_R,is_aux1,pcis->vec1_B,is_aux2,&pcbddc->R_to_B);CHKERRQ(ierr); 4849a64d13efSStefano Zampini ierr = ISDestroy(&is_aux1);CHKERRQ(ierr); 4850a64d13efSStefano Zampini ierr = ISDestroy(&is_aux2);CHKERRQ(ierr); 4851a64d13efSStefano Zampini 48528eeda7d8SStefano Zampini if (pcbddc->switch_static || pcbddc->dbg_flag) { 4853785e854fSJed Brown ierr = PetscMalloc1(n_D,&aux_array1);CHKERRQ(ierr); 4854a64d13efSStefano Zampini for (i=0, j=0; i<n_R; i++) { 48554641a718SStefano Zampini if (PetscBTLookup(bitmask,idx_R_local[i])) { 48564641a718SStefano Zampini aux_array1[j++] = i; 4857a64d13efSStefano Zampini } 4858a64d13efSStefano Zampini } 4859a64d13efSStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,j,aux_array1,PETSC_OWN_POINTER,&is_aux1);CHKERRQ(ierr); 4860a64d13efSStefano Zampini ierr = VecScatterCreate(pcbddc->vec1_R,is_aux1,pcis->vec1_D,(IS)0,&pcbddc->R_to_D);CHKERRQ(ierr); 4861a64d13efSStefano Zampini ierr = ISDestroy(&is_aux1);CHKERRQ(ierr); 4862a64d13efSStefano Zampini } 48634641a718SStefano Zampini ierr = PetscBTDestroy(&bitmask);CHKERRQ(ierr); 48643a50541eSStefano Zampini ierr = ISRestoreIndices(pcbddc->is_R_local,(const 
PetscInt**)&idx_R_local);CHKERRQ(ierr); 4865d62866d3SStefano Zampini } else { 4866df4d28bfSStefano Zampini PCBDDCReuseSolvers reuse_solver = sub_schurs->reuse_solver; 48676816873aSStefano Zampini IS tis; 48686816873aSStefano Zampini PetscInt schur_size; 48696816873aSStefano Zampini 4870df4d28bfSStefano Zampini ierr = ISGetLocalSize(reuse_solver->is_B,&schur_size);CHKERRQ(ierr); 48716816873aSStefano Zampini ierr = ISCreateStride(PETSC_COMM_SELF,schur_size,n_D,1,&tis);CHKERRQ(ierr); 4872df4d28bfSStefano Zampini ierr = VecScatterCreate(pcbddc->vec1_R,tis,pcis->vec1_B,reuse_solver->is_B,&pcbddc->R_to_B);CHKERRQ(ierr); 48736816873aSStefano Zampini ierr = ISDestroy(&tis);CHKERRQ(ierr); 48746816873aSStefano Zampini if (pcbddc->switch_static || pcbddc->dbg_flag) { 48756816873aSStefano Zampini ierr = ISCreateStride(PETSC_COMM_SELF,n_D,0,1,&tis);CHKERRQ(ierr); 48766816873aSStefano Zampini ierr = VecScatterCreate(pcbddc->vec1_R,tis,pcis->vec1_D,(IS)0,&pcbddc->R_to_D);CHKERRQ(ierr); 48776816873aSStefano Zampini ierr = ISDestroy(&tis);CHKERRQ(ierr); 4878d62866d3SStefano Zampini } 4879d62866d3SStefano Zampini } 4880a64d13efSStefano Zampini PetscFunctionReturn(0); 4881a64d13efSStefano Zampini } 4882a64d13efSStefano Zampini 4883304d26faSStefano Zampini 4884684f6988SStefano Zampini PetscErrorCode PCBDDCSetUpLocalSolvers(PC pc, PetscBool dirichlet, PetscBool neumann) 4885304d26faSStefano Zampini { 4886304d26faSStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 4887304d26faSStefano Zampini PC_IS *pcis = (PC_IS*)pc->data; 4888304d26faSStefano Zampini PC pc_temp; 4889304d26faSStefano Zampini Mat A_RR; 4890f4ddd8eeSStefano Zampini MatReuse reuse; 4891304d26faSStefano Zampini PetscScalar m_one = -1.0; 4892304d26faSStefano Zampini PetscReal value; 489304708bb6SStefano Zampini PetscInt n_D,n_R; 489435529e7bSStefano Zampini PetscBool check_corr,issbaij; 4895304d26faSStefano Zampini PetscErrorCode ierr; 4896e604994aSStefano Zampini /* prefixes stuff */ 4897312be037SStefano Zampini char 
dir_prefix[256],neu_prefix[256],str_level[16]; 4898e604994aSStefano Zampini size_t len; 4899304d26faSStefano Zampini 4900304d26faSStefano Zampini PetscFunctionBegin; 4901304d26faSStefano Zampini 4902e604994aSStefano Zampini /* compute prefixes */ 4903e604994aSStefano Zampini ierr = PetscStrcpy(dir_prefix,"");CHKERRQ(ierr); 4904e604994aSStefano Zampini ierr = PetscStrcpy(neu_prefix,"");CHKERRQ(ierr); 4905e604994aSStefano Zampini if (!pcbddc->current_level) { 4906e604994aSStefano Zampini ierr = PetscStrcpy(dir_prefix,((PetscObject)pc)->prefix);CHKERRQ(ierr); 4907e604994aSStefano Zampini ierr = PetscStrcpy(neu_prefix,((PetscObject)pc)->prefix);CHKERRQ(ierr); 4908e604994aSStefano Zampini ierr = PetscStrcat(dir_prefix,"pc_bddc_dirichlet_");CHKERRQ(ierr); 4909e604994aSStefano Zampini ierr = PetscStrcat(neu_prefix,"pc_bddc_neumann_");CHKERRQ(ierr); 4910e604994aSStefano Zampini } else { 491135529e7bSStefano Zampini ierr = PetscSNPrintf(str_level,sizeof(str_level),"l%d_",(int)(pcbddc->current_level));CHKERRQ(ierr); 4912e604994aSStefano Zampini ierr = PetscStrlen(((PetscObject)pc)->prefix,&len);CHKERRQ(ierr); 4913e604994aSStefano Zampini len -= 15; /* remove "pc_bddc_coarse_" */ 4914312be037SStefano Zampini if (pcbddc->current_level>1) len -= 3; /* remove "lX_" with X level number */ 4915312be037SStefano Zampini if (pcbddc->current_level>10) len -= 1; /* remove another char from level number */ 491634d6797cSStefano Zampini ierr = PetscStrncpy(dir_prefix,((PetscObject)pc)->prefix,len+1);CHKERRQ(ierr); 491734d6797cSStefano Zampini ierr = PetscStrncpy(neu_prefix,((PetscObject)pc)->prefix,len+1);CHKERRQ(ierr); 4918e604994aSStefano Zampini ierr = PetscStrcat(dir_prefix,"pc_bddc_dirichlet_");CHKERRQ(ierr); 4919e604994aSStefano Zampini ierr = PetscStrcat(neu_prefix,"pc_bddc_neumann_");CHKERRQ(ierr); 4920e604994aSStefano Zampini ierr = PetscStrcat(dir_prefix,str_level);CHKERRQ(ierr); 4921e604994aSStefano Zampini ierr = PetscStrcat(neu_prefix,str_level);CHKERRQ(ierr); 
4922e604994aSStefano Zampini } 4923e604994aSStefano Zampini 4924304d26faSStefano Zampini /* DIRICHLET PROBLEM */ 4925684f6988SStefano Zampini if (dirichlet) { 4926d5574798SStefano Zampini PCBDDCSubSchurs sub_schurs = pcbddc->sub_schurs; 4927450f8f5eSStefano Zampini if (pcbddc->benign_n && !pcbddc->benign_change_explicit) { 49289a962809SStefano Zampini if (!sub_schurs || !sub_schurs->reuse_solver) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"Not yet implemented\n"); 4929450f8f5eSStefano Zampini if (pcbddc->dbg_flag) { 4930a3df083aSStefano Zampini Mat A_IIn; 4931a3df083aSStefano Zampini 4932a3df083aSStefano Zampini ierr = PCBDDCBenignProject(pc,pcis->is_I_local,pcis->is_I_local,&A_IIn);CHKERRQ(ierr); 4933a3df083aSStefano Zampini ierr = MatDestroy(&pcis->A_II);CHKERRQ(ierr); 4934a3df083aSStefano Zampini pcis->A_II = A_IIn; 4935a3df083aSStefano Zampini } 4936450f8f5eSStefano Zampini } 49373301b35fSStefano Zampini if (pcbddc->local_mat->symmetric_set) { 49383301b35fSStefano Zampini ierr = MatSetOption(pcis->A_II,MAT_SYMMETRIC,pcbddc->local_mat->symmetric_set);CHKERRQ(ierr); 4939964fefecSStefano Zampini } 4940ac78edfcSStefano Zampini /* Matrix for Dirichlet problem is pcis->A_II */ 4941964fefecSStefano Zampini n_D = pcis->n - pcis->n_B; 4942304d26faSStefano Zampini if (!pcbddc->ksp_D) { /* create object if not yet build */ 4943304d26faSStefano Zampini ierr = KSPCreate(PETSC_COMM_SELF,&pcbddc->ksp_D);CHKERRQ(ierr); 4944304d26faSStefano Zampini ierr = PetscObjectIncrementTabLevel((PetscObject)pcbddc->ksp_D,(PetscObject)pc,1);CHKERRQ(ierr); 4945304d26faSStefano Zampini /* default */ 4946304d26faSStefano Zampini ierr = KSPSetType(pcbddc->ksp_D,KSPPREONLY);CHKERRQ(ierr); 4947e604994aSStefano Zampini ierr = KSPSetOptionsPrefix(pcbddc->ksp_D,dir_prefix);CHKERRQ(ierr); 49489577ea80SStefano Zampini ierr = PetscObjectTypeCompare((PetscObject)pcis->A_II,MATSEQSBAIJ,&issbaij);CHKERRQ(ierr); 4949304d26faSStefano Zampini ierr = KSPGetPC(pcbddc->ksp_D,&pc_temp);CHKERRQ(ierr); 
49509577ea80SStefano Zampini if (issbaij) { 49519577ea80SStefano Zampini ierr = PCSetType(pc_temp,PCCHOLESKY);CHKERRQ(ierr); 49529577ea80SStefano Zampini } else { 4953304d26faSStefano Zampini ierr = PCSetType(pc_temp,PCLU);CHKERRQ(ierr); 49549577ea80SStefano Zampini } 4955304d26faSStefano Zampini /* Allow user's customization */ 4956304d26faSStefano Zampini ierr = KSPSetFromOptions(pcbddc->ksp_D);CHKERRQ(ierr); 4957304d26faSStefano Zampini ierr = PCFactorSetReuseFill(pc_temp,PETSC_TRUE);CHKERRQ(ierr); 4958304d26faSStefano Zampini } 4959d1e9a80fSBarry Smith ierr = KSPSetOperators(pcbddc->ksp_D,pcis->A_II,pcis->A_II);CHKERRQ(ierr); 4960b334f244SStefano Zampini if (sub_schurs && sub_schurs->reuse_solver) { 4961df4d28bfSStefano Zampini PCBDDCReuseSolvers reuse_solver = sub_schurs->reuse_solver; 4962d62866d3SStefano Zampini 4963df4d28bfSStefano Zampini ierr = KSPSetPC(pcbddc->ksp_D,reuse_solver->interior_solver);CHKERRQ(ierr); 4964d5574798SStefano Zampini } 4965304d26faSStefano Zampini /* umfpack interface has a bug when matrix dimension is zero. 
TODO solve from umfpack interface */ 4966304d26faSStefano Zampini if (!n_D) { 4967304d26faSStefano Zampini ierr = KSPGetPC(pcbddc->ksp_D,&pc_temp);CHKERRQ(ierr); 4968304d26faSStefano Zampini ierr = PCSetType(pc_temp,PCNONE);CHKERRQ(ierr); 4969304d26faSStefano Zampini } 4970304d26faSStefano Zampini /* Set Up KSP for Dirichlet problem of BDDC */ 4971304d26faSStefano Zampini ierr = KSPSetUp(pcbddc->ksp_D);CHKERRQ(ierr); 4972304d26faSStefano Zampini /* set ksp_D into pcis data */ 4973304d26faSStefano Zampini ierr = KSPDestroy(&pcis->ksp_D);CHKERRQ(ierr); 4974304d26faSStefano Zampini ierr = PetscObjectReference((PetscObject)pcbddc->ksp_D);CHKERRQ(ierr); 4975304d26faSStefano Zampini pcis->ksp_D = pcbddc->ksp_D; 4976684f6988SStefano Zampini } 4977304d26faSStefano Zampini 4978304d26faSStefano Zampini /* NEUMANN PROBLEM */ 4979684f6988SStefano Zampini A_RR = 0; 4980684f6988SStefano Zampini if (neumann) { 4981d62866d3SStefano Zampini PCBDDCSubSchurs sub_schurs = pcbddc->sub_schurs; 498204708bb6SStefano Zampini PetscInt ibs,mbs; 49830aa714b2SStefano Zampini PetscBool issbaij, reuse_neumann_solver; 498404708bb6SStefano Zampini Mat_IS* matis = (Mat_IS*)pc->pmat->data; 49850aa714b2SStefano Zampini 49860aa714b2SStefano Zampini reuse_neumann_solver = PETSC_FALSE; 49870aa714b2SStefano Zampini if (sub_schurs && sub_schurs->reuse_solver) { 49880aa714b2SStefano Zampini IS iP; 49890aa714b2SStefano Zampini 49900aa714b2SStefano Zampini reuse_neumann_solver = PETSC_TRUE; 49910aa714b2SStefano Zampini ierr = PetscObjectQuery((PetscObject)sub_schurs->A,"__KSPFETIDP_iP",(PetscObject*)&iP);CHKERRQ(ierr); 49920aa714b2SStefano Zampini if (iP) reuse_neumann_solver = PETSC_FALSE; 49930aa714b2SStefano Zampini } 4994f4ddd8eeSStefano Zampini /* Matrix for Neumann problem is A_RR -> we need to create/reuse it at this point */ 49958ce42a96SStefano Zampini ierr = ISGetSize(pcbddc->is_R_local,&n_R);CHKERRQ(ierr); 4996f4ddd8eeSStefano Zampini if (pcbddc->ksp_R) { /* already created ksp */ 
4997f4ddd8eeSStefano Zampini PetscInt nn_R; 499881d9aea3SBarry Smith ierr = KSPGetOperators(pcbddc->ksp_R,NULL,&A_RR);CHKERRQ(ierr); 4999f4ddd8eeSStefano Zampini ierr = PetscObjectReference((PetscObject)A_RR);CHKERRQ(ierr); 5000f4ddd8eeSStefano Zampini ierr = MatGetSize(A_RR,&nn_R,NULL);CHKERRQ(ierr); 5001f4ddd8eeSStefano Zampini if (nn_R != n_R) { /* old ksp is not reusable, so reset it */ 5002f4ddd8eeSStefano Zampini ierr = KSPReset(pcbddc->ksp_R);CHKERRQ(ierr); 5003f4ddd8eeSStefano Zampini ierr = MatDestroy(&A_RR);CHKERRQ(ierr); 5004f4ddd8eeSStefano Zampini reuse = MAT_INITIAL_MATRIX; 5005f4ddd8eeSStefano Zampini } else { /* same sizes, but nonzero pattern depend on primal vertices so it can be changed */ 5006727cdba6SStefano Zampini if (pcbddc->new_primal_space_local) { /* we are not sure the matrix will have the same nonzero pattern */ 5007f4ddd8eeSStefano Zampini ierr = MatDestroy(&A_RR);CHKERRQ(ierr); 5008f4ddd8eeSStefano Zampini reuse = MAT_INITIAL_MATRIX; 5009f4ddd8eeSStefano Zampini } else { /* safe to reuse the matrix */ 5010f4ddd8eeSStefano Zampini reuse = MAT_REUSE_MATRIX; 5011f4ddd8eeSStefano Zampini } 5012f4ddd8eeSStefano Zampini } 5013f4ddd8eeSStefano Zampini /* last check */ 5014d1e9a80fSBarry Smith if (pc->flag == DIFFERENT_NONZERO_PATTERN) { 5015f4ddd8eeSStefano Zampini ierr = MatDestroy(&A_RR);CHKERRQ(ierr); 5016f4ddd8eeSStefano Zampini reuse = MAT_INITIAL_MATRIX; 5017f4ddd8eeSStefano Zampini } 5018f4ddd8eeSStefano Zampini } else { /* first time, so we need to create the matrix */ 5019f4ddd8eeSStefano Zampini reuse = MAT_INITIAL_MATRIX; 5020f4ddd8eeSStefano Zampini } 5021a00504b5SStefano Zampini /* convert pcbddc->local_mat if needed later in PCBDDCSetUpCorrection */ 5022af732b37SStefano Zampini ierr = MatGetBlockSize(pcbddc->local_mat,&mbs);CHKERRQ(ierr); 5023af732b37SStefano Zampini ierr = ISGetBlockSize(pcbddc->is_R_local,&ibs);CHKERRQ(ierr); 502404708bb6SStefano Zampini ierr = 
PetscObjectTypeCompare((PetscObject)pcbddc->local_mat,MATSEQSBAIJ,&issbaij);CHKERRQ(ierr); 502504708bb6SStefano Zampini if (ibs != mbs) { /* need to convert to SEQAIJ to extract any submatrix with is_R_local */ 502604708bb6SStefano Zampini if (matis->A == pcbddc->local_mat) { 502704708bb6SStefano Zampini ierr = MatDestroy(&pcbddc->local_mat);CHKERRQ(ierr); 502804708bb6SStefano Zampini ierr = MatConvert(matis->A,MATSEQAIJ,MAT_INITIAL_MATRIX,&pcbddc->local_mat);CHKERRQ(ierr); 5029af732b37SStefano Zampini } else { 5030511c6705SHong Zhang ierr = MatConvert(pcbddc->local_mat,MATSEQAIJ,MAT_INPLACE_MATRIX,&pcbddc->local_mat);CHKERRQ(ierr); 50316816873aSStefano Zampini } 503204708bb6SStefano Zampini } else if (issbaij) { /* need to convert to BAIJ to get offdiagonal blocks */ 503304708bb6SStefano Zampini if (matis->A == pcbddc->local_mat) { 503404708bb6SStefano Zampini ierr = MatDestroy(&pcbddc->local_mat);CHKERRQ(ierr); 503504708bb6SStefano Zampini ierr = MatConvert(matis->A,MATSEQBAIJ,MAT_INITIAL_MATRIX,&pcbddc->local_mat);CHKERRQ(ierr); 503604708bb6SStefano Zampini } else { 5037511c6705SHong Zhang ierr = MatConvert(pcbddc->local_mat,MATSEQBAIJ,MAT_INPLACE_MATRIX,&pcbddc->local_mat);CHKERRQ(ierr); 503804708bb6SStefano Zampini } 503904708bb6SStefano Zampini } 5040a00504b5SStefano Zampini /* extract A_RR */ 50410aa714b2SStefano Zampini if (reuse_neumann_solver) { 5042a00504b5SStefano Zampini PCBDDCReuseSolvers reuse_solver = sub_schurs->reuse_solver; 5043a00504b5SStefano Zampini 5044a00504b5SStefano Zampini if (pcbddc->dbg_flag) { /* we need A_RR to test the solver later */ 504516e386b8SStefano Zampini ierr = MatDestroy(&A_RR);CHKERRQ(ierr); 5046a00504b5SStefano Zampini if (reuse_solver->benign_n) { /* we are not using the explicit change of basis on the pressures */ 504716e386b8SStefano Zampini ierr = PCBDDCBenignProject(pc,pcbddc->is_R_local,pcbddc->is_R_local,&A_RR);CHKERRQ(ierr); 504816e386b8SStefano Zampini } else { 50497dae84e0SHong Zhang ierr = 
MatCreateSubMatrix(pcbddc->local_mat,pcbddc->is_R_local,pcbddc->is_R_local,MAT_INITIAL_MATRIX,&A_RR);CHKERRQ(ierr); 5050a00504b5SStefano Zampini } 5051a00504b5SStefano Zampini } else { 5052a00504b5SStefano Zampini ierr = MatDestroy(&A_RR);CHKERRQ(ierr); 5053a00504b5SStefano Zampini ierr = PCGetOperators(reuse_solver->correction_solver,&A_RR,NULL);CHKERRQ(ierr); 5054a00504b5SStefano Zampini ierr = PetscObjectReference((PetscObject)A_RR);CHKERRQ(ierr); 5055a00504b5SStefano Zampini } 5056a00504b5SStefano Zampini } else { /* we have to build the neumann solver, so we need to extract the relevant matrix */ 50577dae84e0SHong Zhang ierr = MatCreateSubMatrix(pcbddc->local_mat,pcbddc->is_R_local,pcbddc->is_R_local,reuse,&A_RR);CHKERRQ(ierr); 505816e386b8SStefano Zampini } 50593301b35fSStefano Zampini if (pcbddc->local_mat->symmetric_set) { 50603301b35fSStefano Zampini ierr = MatSetOption(A_RR,MAT_SYMMETRIC,pcbddc->local_mat->symmetric_set);CHKERRQ(ierr); 50616816873aSStefano Zampini } 5062f4ddd8eeSStefano Zampini if (!pcbddc->ksp_R) { /* create object if not present */ 5063304d26faSStefano Zampini ierr = KSPCreate(PETSC_COMM_SELF,&pcbddc->ksp_R);CHKERRQ(ierr); 5064304d26faSStefano Zampini ierr = PetscObjectIncrementTabLevel((PetscObject)pcbddc->ksp_R,(PetscObject)pc,1);CHKERRQ(ierr); 5065304d26faSStefano Zampini /* default */ 5066304d26faSStefano Zampini ierr = KSPSetType(pcbddc->ksp_R,KSPPREONLY);CHKERRQ(ierr); 5067e604994aSStefano Zampini ierr = KSPSetOptionsPrefix(pcbddc->ksp_R,neu_prefix);CHKERRQ(ierr); 5068304d26faSStefano Zampini ierr = KSPGetPC(pcbddc->ksp_R,&pc_temp);CHKERRQ(ierr); 50699577ea80SStefano Zampini ierr = PetscObjectTypeCompare((PetscObject)A_RR,MATSEQSBAIJ,&issbaij);CHKERRQ(ierr); 50709577ea80SStefano Zampini if (issbaij) { 50719577ea80SStefano Zampini ierr = PCSetType(pc_temp,PCCHOLESKY);CHKERRQ(ierr); 50729577ea80SStefano Zampini } else { 5073304d26faSStefano Zampini ierr = PCSetType(pc_temp,PCLU);CHKERRQ(ierr); 50749577ea80SStefano Zampini } 
5075304d26faSStefano Zampini /* Allow user's customization */ 5076304d26faSStefano Zampini ierr = KSPSetFromOptions(pcbddc->ksp_R);CHKERRQ(ierr); 5077304d26faSStefano Zampini ierr = PCFactorSetReuseFill(pc_temp,PETSC_TRUE);CHKERRQ(ierr); 5078304d26faSStefano Zampini } 5079304d26faSStefano Zampini /* umfpack interface has a bug when matrix dimension is zero. TODO solve from umfpack interface */ 5080304d26faSStefano Zampini if (!n_R) { 5081304d26faSStefano Zampini ierr = KSPGetPC(pcbddc->ksp_R,&pc_temp);CHKERRQ(ierr); 5082304d26faSStefano Zampini ierr = PCSetType(pc_temp,PCNONE);CHKERRQ(ierr); 5083304d26faSStefano Zampini } 50845cbda25cSStefano Zampini ierr = KSPSetOperators(pcbddc->ksp_R,A_RR,A_RR);CHKERRQ(ierr); 5085df4d28bfSStefano Zampini /* Reuse solver if it is present */ 50860aa714b2SStefano Zampini if (reuse_neumann_solver) { 5087df4d28bfSStefano Zampini PCBDDCReuseSolvers reuse_solver = sub_schurs->reuse_solver; 5088d62866d3SStefano Zampini 5089df4d28bfSStefano Zampini ierr = KSPSetPC(pcbddc->ksp_R,reuse_solver->correction_solver);CHKERRQ(ierr); 5090d62866d3SStefano Zampini } 5091304d26faSStefano Zampini /* Set Up KSP for Neumann problem of BDDC */ 5092304d26faSStefano Zampini ierr = KSPSetUp(pcbddc->ksp_R);CHKERRQ(ierr); 5093684f6988SStefano Zampini } 5094304d26faSStefano Zampini 5095684f6988SStefano Zampini if (pcbddc->dbg_flag) { 5096684f6988SStefano Zampini ierr = PetscViewerFlush(pcbddc->dbg_viewer);CHKERRQ(ierr); 50971575c14dSBarry Smith ierr = PetscViewerASCIIPushSynchronized(pcbddc->dbg_viewer);CHKERRQ(ierr); 5098684f6988SStefano Zampini ierr = PetscViewerASCIIPrintf(pcbddc->dbg_viewer,"--------------------------------------------------\n");CHKERRQ(ierr); 5099684f6988SStefano Zampini } 5100c7017625SStefano Zampini 5101c7017625SStefano Zampini /* adapt Dirichlet and Neumann solvers if a nullspace correction has been requested */ 510235529e7bSStefano Zampini check_corr = PETSC_FALSE; 5103c7017625SStefano Zampini if (pcbddc->NullSpace_corr[0]) { 
5104c7017625SStefano Zampini ierr = PCBDDCSetUseExactDirichlet(pc,PETSC_FALSE);CHKERRQ(ierr); 5105c7017625SStefano Zampini } 5106c7017625SStefano Zampini if (dirichlet && pcbddc->NullSpace_corr[0] && !pcbddc->switch_static) { 510735529e7bSStefano Zampini check_corr = PETSC_TRUE; 5108c7017625SStefano Zampini ierr = PCBDDCNullSpaceAssembleCorrection(pc,PETSC_TRUE,pcbddc->NullSpace_corr[1]);CHKERRQ(ierr); 5109c7017625SStefano Zampini } 5110c7017625SStefano Zampini if (neumann && pcbddc->NullSpace_corr[2]) { 511135529e7bSStefano Zampini check_corr = PETSC_TRUE; 5112c7017625SStefano Zampini ierr = PCBDDCNullSpaceAssembleCorrection(pc,PETSC_FALSE,pcbddc->NullSpace_corr[3]);CHKERRQ(ierr); 5113c7017625SStefano Zampini } 5114c7017625SStefano Zampini /* check Dirichlet and Neumann solvers */ 5115c7017625SStefano Zampini if (pcbddc->dbg_flag) { 5116684f6988SStefano Zampini if (dirichlet) { /* Dirichlet */ 51170fccc4e9SStefano Zampini ierr = VecSetRandom(pcis->vec1_D,NULL);CHKERRQ(ierr); 51180fccc4e9SStefano Zampini ierr = MatMult(pcis->A_II,pcis->vec1_D,pcis->vec2_D);CHKERRQ(ierr); 51190fccc4e9SStefano Zampini ierr = KSPSolve(pcbddc->ksp_D,pcis->vec2_D,pcis->vec2_D);CHKERRQ(ierr); 51200fccc4e9SStefano Zampini ierr = VecAXPY(pcis->vec1_D,m_one,pcis->vec2_D);CHKERRQ(ierr); 51210fccc4e9SStefano Zampini ierr = VecNorm(pcis->vec1_D,NORM_INFINITY,&value);CHKERRQ(ierr); 5122e604994aSStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"Subdomain %04d infinity error for Dirichlet solve (%s) = % 1.14e \n",PetscGlobalRank,((PetscObject)(pcbddc->ksp_D))->prefix,value);CHKERRQ(ierr); 512335529e7bSStefano Zampini if (check_corr) { 5124c7017625SStefano Zampini ierr = PCBDDCNullSpaceCheckCorrection(pc,PETSC_TRUE);CHKERRQ(ierr); 5125c7017625SStefano Zampini } 5126304d26faSStefano Zampini ierr = PetscViewerFlush(pcbddc->dbg_viewer);CHKERRQ(ierr); 5127304d26faSStefano Zampini } 5128684f6988SStefano Zampini if (neumann) { /* Neumann */ 51290fccc4e9SStefano Zampini ierr = 
VecSetRandom(pcbddc->vec1_R,NULL);CHKERRQ(ierr); 51300fccc4e9SStefano Zampini ierr = MatMult(A_RR,pcbddc->vec1_R,pcbddc->vec2_R);CHKERRQ(ierr); 51310fccc4e9SStefano Zampini ierr = KSPSolve(pcbddc->ksp_R,pcbddc->vec2_R,pcbddc->vec2_R);CHKERRQ(ierr); 51320fccc4e9SStefano Zampini ierr = VecAXPY(pcbddc->vec1_R,m_one,pcbddc->vec2_R);CHKERRQ(ierr); 51330fccc4e9SStefano Zampini ierr = VecNorm(pcbddc->vec1_R,NORM_INFINITY,&value);CHKERRQ(ierr); 5134e604994aSStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"Subdomain %04d infinity error for Neumann solve (%s) = % 1.14e\n",PetscGlobalRank,((PetscObject)(pcbddc->ksp_R))->prefix,value);CHKERRQ(ierr); 513535529e7bSStefano Zampini if (check_corr) { 5136c7017625SStefano Zampini ierr = PCBDDCNullSpaceCheckCorrection(pc,PETSC_FALSE);CHKERRQ(ierr); 5137c7017625SStefano Zampini } 5138304d26faSStefano Zampini ierr = PetscViewerFlush(pcbddc->dbg_viewer);CHKERRQ(ierr); 5139304d26faSStefano Zampini } 5140684f6988SStefano Zampini } 51415cbda25cSStefano Zampini /* free Neumann problem's matrix */ 51425cbda25cSStefano Zampini ierr = MatDestroy(&A_RR);CHKERRQ(ierr); 5143304d26faSStefano Zampini PetscFunctionReturn(0); 5144304d26faSStefano Zampini } 5145304d26faSStefano Zampini 514680677318SStefano Zampini static PetscErrorCode PCBDDCSolveSubstructureCorrection(PC pc, Vec inout_B, Vec inout_D, PetscBool applytranspose) 5147674ae819SStefano Zampini { 5148674ae819SStefano Zampini PetscErrorCode ierr; 5149674ae819SStefano Zampini PC_BDDC* pcbddc = (PC_BDDC*)(pc->data); 5150be83ff47SStefano Zampini PCBDDCSubSchurs sub_schurs = pcbddc->sub_schurs; 5151b334f244SStefano Zampini PetscBool reuse_solver = sub_schurs ? ( sub_schurs->reuse_solver ? 
PETSC_TRUE : PETSC_FALSE ) : PETSC_FALSE; 5152674ae819SStefano Zampini 5153674ae819SStefano Zampini PetscFunctionBegin; 5154b334f244SStefano Zampini if (!reuse_solver) { 515580677318SStefano Zampini ierr = VecSet(pcbddc->vec1_R,0.);CHKERRQ(ierr); 515620c7b377SStefano Zampini } 515780677318SStefano Zampini if (!pcbddc->switch_static) { 515880677318SStefano Zampini if (applytranspose && pcbddc->local_auxmat1) { 515980677318SStefano Zampini ierr = MatMultTranspose(pcbddc->local_auxmat2,inout_B,pcbddc->vec1_C);CHKERRQ(ierr); 516080677318SStefano Zampini ierr = MatMultTransposeAdd(pcbddc->local_auxmat1,pcbddc->vec1_C,inout_B,inout_B);CHKERRQ(ierr); 516120c7b377SStefano Zampini } 5162b334f244SStefano Zampini if (!reuse_solver) { 516380677318SStefano Zampini ierr = VecScatterBegin(pcbddc->R_to_B,inout_B,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 516480677318SStefano Zampini ierr = VecScatterEnd(pcbddc->R_to_B,inout_B,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 516520c7b377SStefano Zampini } else { 5166df4d28bfSStefano Zampini PCBDDCReuseSolvers reuse_solver = sub_schurs->reuse_solver; 5167be83ff47SStefano Zampini 5168df4d28bfSStefano Zampini ierr = VecScatterBegin(reuse_solver->correction_scatter_B,inout_B,reuse_solver->rhs_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 5169df4d28bfSStefano Zampini ierr = VecScatterEnd(reuse_solver->correction_scatter_B,inout_B,reuse_solver->rhs_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 517020c7b377SStefano Zampini } 5171be83ff47SStefano Zampini } else { 517280677318SStefano Zampini ierr = VecScatterBegin(pcbddc->R_to_B,inout_B,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 517380677318SStefano Zampini ierr = VecScatterEnd(pcbddc->R_to_B,inout_B,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 517480677318SStefano Zampini ierr = VecScatterBegin(pcbddc->R_to_D,inout_D,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 517580677318SStefano Zampini ierr = 
VecScatterEnd(pcbddc->R_to_D,inout_D,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 517680677318SStefano Zampini if (applytranspose && pcbddc->local_auxmat1) { 517780677318SStefano Zampini ierr = MatMultTranspose(pcbddc->local_auxmat2,pcbddc->vec1_R,pcbddc->vec1_C);CHKERRQ(ierr); 517880677318SStefano Zampini ierr = MatMultTransposeAdd(pcbddc->local_auxmat1,pcbddc->vec1_C,inout_B,inout_B);CHKERRQ(ierr); 517980677318SStefano Zampini ierr = VecScatterBegin(pcbddc->R_to_B,inout_B,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 518080677318SStefano Zampini ierr = VecScatterEnd(pcbddc->R_to_B,inout_B,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 5181674ae819SStefano Zampini } 5182674ae819SStefano Zampini } 5183b334f244SStefano Zampini if (!reuse_solver || pcbddc->switch_static) { 518480677318SStefano Zampini if (applytranspose) { 518580677318SStefano Zampini ierr = KSPSolveTranspose(pcbddc->ksp_R,pcbddc->vec1_R,pcbddc->vec1_R);CHKERRQ(ierr); 518680677318SStefano Zampini } else { 518780677318SStefano Zampini ierr = KSPSolve(pcbddc->ksp_R,pcbddc->vec1_R,pcbddc->vec1_R);CHKERRQ(ierr); 518880677318SStefano Zampini } 5189be83ff47SStefano Zampini } else { 5190df4d28bfSStefano Zampini PCBDDCReuseSolvers reuse_solver = sub_schurs->reuse_solver; 5191be83ff47SStefano Zampini 5192be83ff47SStefano Zampini if (applytranspose) { 5193df4d28bfSStefano Zampini ierr = MatFactorSolveSchurComplementTranspose(reuse_solver->F,reuse_solver->rhs_B,reuse_solver->sol_B);CHKERRQ(ierr); 5194be83ff47SStefano Zampini } else { 5195df4d28bfSStefano Zampini ierr = MatFactorSolveSchurComplement(reuse_solver->F,reuse_solver->rhs_B,reuse_solver->sol_B);CHKERRQ(ierr); 5196be83ff47SStefano Zampini } 5197be83ff47SStefano Zampini } 519880677318SStefano Zampini ierr = VecSet(inout_B,0.);CHKERRQ(ierr); 519980677318SStefano Zampini if (!pcbddc->switch_static) { 5200b334f244SStefano Zampini if (!reuse_solver) { 520180677318SStefano Zampini ierr = 
VecScatterBegin(pcbddc->R_to_B,pcbddc->vec1_R,inout_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 520280677318SStefano Zampini ierr = VecScatterEnd(pcbddc->R_to_B,pcbddc->vec1_R,inout_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 5203be83ff47SStefano Zampini } else { 5204df4d28bfSStefano Zampini PCBDDCReuseSolvers reuse_solver = sub_schurs->reuse_solver; 5205be83ff47SStefano Zampini 5206df4d28bfSStefano Zampini ierr = VecScatterBegin(reuse_solver->correction_scatter_B,reuse_solver->sol_B,inout_B,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 5207df4d28bfSStefano Zampini ierr = VecScatterEnd(reuse_solver->correction_scatter_B,reuse_solver->sol_B,inout_B,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 5208be83ff47SStefano Zampini } 520980677318SStefano Zampini if (!applytranspose && pcbddc->local_auxmat1) { 521080677318SStefano Zampini ierr = MatMult(pcbddc->local_auxmat1,inout_B,pcbddc->vec1_C);CHKERRQ(ierr); 521180677318SStefano Zampini ierr = MatMultAdd(pcbddc->local_auxmat2,pcbddc->vec1_C,inout_B,inout_B);CHKERRQ(ierr); 521280677318SStefano Zampini } 521380677318SStefano Zampini } else { 521480677318SStefano Zampini ierr = VecScatterBegin(pcbddc->R_to_B,pcbddc->vec1_R,inout_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 521580677318SStefano Zampini ierr = VecScatterEnd(pcbddc->R_to_B,pcbddc->vec1_R,inout_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 521680677318SStefano Zampini ierr = VecScatterBegin(pcbddc->R_to_D,pcbddc->vec1_R,inout_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 521780677318SStefano Zampini ierr = VecScatterEnd(pcbddc->R_to_D,pcbddc->vec1_R,inout_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 521880677318SStefano Zampini if (!applytranspose && pcbddc->local_auxmat1) { 521980677318SStefano Zampini ierr = MatMult(pcbddc->local_auxmat1,inout_B,pcbddc->vec1_C);CHKERRQ(ierr); 522080677318SStefano Zampini ierr = MatMultAdd(pcbddc->local_auxmat2,pcbddc->vec1_C,pcbddc->vec1_R,pcbddc->vec1_R);CHKERRQ(ierr); 522180677318SStefano Zampini } 
522280677318SStefano Zampini ierr = VecScatterBegin(pcbddc->R_to_B,pcbddc->vec1_R,inout_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 522380677318SStefano Zampini ierr = VecScatterEnd(pcbddc->R_to_B,pcbddc->vec1_R,inout_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 522480677318SStefano Zampini ierr = VecScatterBegin(pcbddc->R_to_D,pcbddc->vec1_R,inout_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 522580677318SStefano Zampini ierr = VecScatterEnd(pcbddc->R_to_D,pcbddc->vec1_R,inout_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 5226674ae819SStefano Zampini } 5227674ae819SStefano Zampini PetscFunctionReturn(0); 5228674ae819SStefano Zampini } 5229674ae819SStefano Zampini 5230dc359a40SStefano Zampini /* parameter apply transpose determines if the interface preconditioner should be applied transposed or not */ 5231dc359a40SStefano Zampini PetscErrorCode PCBDDCApplyInterfacePreconditioner(PC pc, PetscBool applytranspose) 5232674ae819SStefano Zampini { 5233674ae819SStefano Zampini PetscErrorCode ierr; 5234674ae819SStefano Zampini PC_BDDC* pcbddc = (PC_BDDC*)(pc->data); 5235674ae819SStefano Zampini PC_IS* pcis = (PC_IS*) (pc->data); 5236674ae819SStefano Zampini const PetscScalar zero = 0.0; 5237674ae819SStefano Zampini 5238674ae819SStefano Zampini PetscFunctionBegin; 5239dc359a40SStefano Zampini /* Application of PSI^T or PHI^T (depending on applytranspose, see comment above) */ 52404fee134fSStefano Zampini if (!pcbddc->benign_apply_coarse_only) { 5241dc359a40SStefano Zampini if (applytranspose) { 5242674ae819SStefano Zampini ierr = MatMultTranspose(pcbddc->coarse_phi_B,pcis->vec1_B,pcbddc->vec1_P);CHKERRQ(ierr); 52438eeda7d8SStefano Zampini if (pcbddc->switch_static) { ierr = MatMultTransposeAdd(pcbddc->coarse_phi_D,pcis->vec1_D,pcbddc->vec1_P,pcbddc->vec1_P);CHKERRQ(ierr); } 5244dc359a40SStefano Zampini } else { 5245674ae819SStefano Zampini ierr = MatMultTranspose(pcbddc->coarse_psi_B,pcis->vec1_B,pcbddc->vec1_P);CHKERRQ(ierr); 5246674ae819SStefano Zampini if 
(pcbddc->switch_static) { ierr = MatMultTransposeAdd(pcbddc->coarse_psi_D,pcis->vec1_D,pcbddc->vec1_P,pcbddc->vec1_P);CHKERRQ(ierr); } 524715aaf578SStefano Zampini } 52484fee134fSStefano Zampini } else { 52494fee134fSStefano Zampini ierr = VecSet(pcbddc->vec1_P,zero);CHKERRQ(ierr); 52504fee134fSStefano Zampini } 5251efc2fbd9SStefano Zampini 5252efc2fbd9SStefano Zampini /* add p0 to the last value of vec1_P holding the coarse dof relative to p0 */ 52534f1b2e48SStefano Zampini if (pcbddc->benign_n) { 5254efc2fbd9SStefano Zampini PetscScalar *array; 52554f1b2e48SStefano Zampini PetscInt j; 5256efc2fbd9SStefano Zampini 5257efc2fbd9SStefano Zampini ierr = VecGetArray(pcbddc->vec1_P,&array);CHKERRQ(ierr); 52584f1b2e48SStefano Zampini for (j=0;j<pcbddc->benign_n;j++) array[pcbddc->local_primal_size-pcbddc->benign_n+j] += pcbddc->benign_p0[j]; 5259efc2fbd9SStefano Zampini ierr = VecRestoreArray(pcbddc->vec1_P,&array);CHKERRQ(ierr); 5260efc2fbd9SStefano Zampini } 5261efc2fbd9SStefano Zampini 526212edc857SStefano Zampini /* start communications from local primal nodes to rhs of coarse solver */ 526312edc857SStefano Zampini ierr = VecSet(pcbddc->coarse_vec,zero);CHKERRQ(ierr); 526412edc857SStefano Zampini ierr = PCBDDCScatterCoarseDataBegin(pc,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 526512edc857SStefano Zampini ierr = PCBDDCScatterCoarseDataEnd(pc,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 526612edc857SStefano Zampini 52679f00e9b4SStefano Zampini /* Coarse solution -> rhs and sol updated inside PCBDDCScattarCoarseDataBegin/End */ 526812edc857SStefano Zampini if (pcbddc->coarse_ksp) { 526951694757SStefano Zampini Mat coarse_mat; 5270964fefecSStefano Zampini Vec rhs,sol; 527151694757SStefano Zampini MatNullSpace nullsp; 527227b6a85dSStefano Zampini PetscBool isbddc = PETSC_FALSE; 5273964fefecSStefano Zampini 527427b6a85dSStefano Zampini if (pcbddc->benign_have_null) { 527527b6a85dSStefano Zampini PC coarse_pc; 527627b6a85dSStefano Zampini 527727b6a85dSStefano Zampini ierr = 
KSPGetPC(pcbddc->coarse_ksp,&coarse_pc);CHKERRQ(ierr); 527827b6a85dSStefano Zampini ierr = PetscObjectTypeCompare((PetscObject)coarse_pc,PCBDDC,&isbddc);CHKERRQ(ierr); 527927b6a85dSStefano Zampini /* we need to propagate to coarser levels the need for a possible benign correction */ 528027b6a85dSStefano Zampini if (isbddc && pcbddc->benign_apply_coarse_only && !pcbddc->benign_skip_correction) { 528127b6a85dSStefano Zampini PC_BDDC* coarsepcbddc = (PC_BDDC*)(coarse_pc->data); 528227b6a85dSStefano Zampini coarsepcbddc->benign_skip_correction = PETSC_FALSE; 52833bca92a6SStefano Zampini coarsepcbddc->benign_apply_coarse_only = PETSC_TRUE; 528427b6a85dSStefano Zampini } 528527b6a85dSStefano Zampini } 5286964fefecSStefano Zampini ierr = KSPGetRhs(pcbddc->coarse_ksp,&rhs);CHKERRQ(ierr); 5287964fefecSStefano Zampini ierr = KSPGetSolution(pcbddc->coarse_ksp,&sol);CHKERRQ(ierr); 528851694757SStefano Zampini ierr = KSPGetOperators(pcbddc->coarse_ksp,&coarse_mat,NULL);CHKERRQ(ierr); 528951694757SStefano Zampini ierr = MatGetNullSpace(coarse_mat,&nullsp);CHKERRQ(ierr); 529051694757SStefano Zampini if (nullsp) { 529151694757SStefano Zampini ierr = MatNullSpaceRemove(nullsp,rhs);CHKERRQ(ierr); 529251694757SStefano Zampini } 529312edc857SStefano Zampini if (applytranspose) { 52949a962809SStefano Zampini if (pcbddc->benign_apply_coarse_only) SETERRQ(PetscObjectComm((PetscObject)pcbddc->coarse_ksp),PETSC_ERR_SUP,"Not yet implemented"); 5295964fefecSStefano Zampini ierr = KSPSolveTranspose(pcbddc->coarse_ksp,rhs,sol);CHKERRQ(ierr); 52962701bc32SStefano Zampini } else { 52971f4df5f7SStefano Zampini if (pcbddc->benign_apply_coarse_only && isbddc) { /* need just to apply the coarse preconditioner during presolve */ 52982701bc32SStefano Zampini PC coarse_pc; 52992701bc32SStefano Zampini 53002701bc32SStefano Zampini ierr = KSPGetPC(pcbddc->coarse_ksp,&coarse_pc);CHKERRQ(ierr); 53012701bc32SStefano Zampini ierr = PCPreSolve(coarse_pc,pcbddc->coarse_ksp);CHKERRQ(ierr); 53023e589ea0SStefano 
Zampini ierr = PCBDDCBenignRemoveInterior(coarse_pc,rhs,sol);CHKERRQ(ierr); 53032701bc32SStefano Zampini ierr = PCPostSolve(coarse_pc,pcbddc->coarse_ksp);CHKERRQ(ierr); 530412edc857SStefano Zampini } else { 5305964fefecSStefano Zampini ierr = KSPSolve(pcbddc->coarse_ksp,rhs,sol);CHKERRQ(ierr); 530612edc857SStefano Zampini } 53072701bc32SStefano Zampini } 53081d82a3b6SStefano Zampini /* we don't need the benign correction at coarser levels anymore */ 530927b6a85dSStefano Zampini if (pcbddc->benign_have_null && isbddc) { 531027b6a85dSStefano Zampini PC coarse_pc; 531127b6a85dSStefano Zampini PC_BDDC* coarsepcbddc; 531227b6a85dSStefano Zampini 531327b6a85dSStefano Zampini ierr = KSPGetPC(pcbddc->coarse_ksp,&coarse_pc);CHKERRQ(ierr); 531427b6a85dSStefano Zampini coarsepcbddc = (PC_BDDC*)(coarse_pc->data); 531527b6a85dSStefano Zampini coarsepcbddc->benign_skip_correction = PETSC_TRUE; 53163bca92a6SStefano Zampini coarsepcbddc->benign_apply_coarse_only = PETSC_FALSE; 531727b6a85dSStefano Zampini } 531851694757SStefano Zampini if (nullsp) { 531951694757SStefano Zampini ierr = MatNullSpaceRemove(nullsp,sol);CHKERRQ(ierr); 532051694757SStefano Zampini } 532112edc857SStefano Zampini } 5322674ae819SStefano Zampini 5323674ae819SStefano Zampini /* Local solution on R nodes */ 53244fee134fSStefano Zampini if (pcis->n && !pcbddc->benign_apply_coarse_only) { 532580677318SStefano Zampini ierr = PCBDDCSolveSubstructureCorrection(pc,pcis->vec1_B,pcis->vec1_D,applytranspose);CHKERRQ(ierr); 53269f00e9b4SStefano Zampini } 53279f00e9b4SStefano Zampini /* communications from coarse sol to local primal nodes */ 53289f00e9b4SStefano Zampini ierr = PCBDDCScatterCoarseDataBegin(pc,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 532912edc857SStefano Zampini ierr = PCBDDCScatterCoarseDataEnd(pc,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 5330674ae819SStefano Zampini 53314fee134fSStefano Zampini /* Sum contributions from the two levels */ 53324fee134fSStefano Zampini if 
(!pcbddc->benign_apply_coarse_only) { 5333dc359a40SStefano Zampini if (applytranspose) { 5334dc359a40SStefano Zampini ierr = MatMultAdd(pcbddc->coarse_psi_B,pcbddc->vec1_P,pcis->vec1_B,pcis->vec1_B);CHKERRQ(ierr); 5335dc359a40SStefano Zampini if (pcbddc->switch_static) { ierr = MatMultAdd(pcbddc->coarse_psi_D,pcbddc->vec1_P,pcis->vec1_D,pcis->vec1_D);CHKERRQ(ierr); } 5336dc359a40SStefano Zampini } else { 5337674ae819SStefano Zampini ierr = MatMultAdd(pcbddc->coarse_phi_B,pcbddc->vec1_P,pcis->vec1_B,pcis->vec1_B);CHKERRQ(ierr); 53388eeda7d8SStefano Zampini if (pcbddc->switch_static) { ierr = MatMultAdd(pcbddc->coarse_phi_D,pcbddc->vec1_P,pcis->vec1_D,pcis->vec1_D);CHKERRQ(ierr); } 5339dc359a40SStefano Zampini } 5340efc2fbd9SStefano Zampini /* store p0 */ 53414f1b2e48SStefano Zampini if (pcbddc->benign_n) { 5342efc2fbd9SStefano Zampini PetscScalar *array; 53434f1b2e48SStefano Zampini PetscInt j; 5344efc2fbd9SStefano Zampini 5345efc2fbd9SStefano Zampini ierr = VecGetArray(pcbddc->vec1_P,&array);CHKERRQ(ierr); 53464f1b2e48SStefano Zampini for (j=0;j<pcbddc->benign_n;j++) pcbddc->benign_p0[j] = array[pcbddc->local_primal_size-pcbddc->benign_n+j]; 5347efc2fbd9SStefano Zampini ierr = VecRestoreArray(pcbddc->vec1_P,&array);CHKERRQ(ierr); 5348efc2fbd9SStefano Zampini } 53494fee134fSStefano Zampini } else { /* expand the coarse solution */ 53504fee134fSStefano Zampini if (applytranspose) { 53514fee134fSStefano Zampini ierr = MatMult(pcbddc->coarse_psi_B,pcbddc->vec1_P,pcis->vec1_B);CHKERRQ(ierr); 53524fee134fSStefano Zampini } else { 53534fee134fSStefano Zampini ierr = MatMult(pcbddc->coarse_phi_B,pcbddc->vec1_P,pcis->vec1_B);CHKERRQ(ierr); 53544fee134fSStefano Zampini } 53554fee134fSStefano Zampini } 5356674ae819SStefano Zampini PetscFunctionReturn(0); 5357674ae819SStefano Zampini } 5358674ae819SStefano Zampini 535912edc857SStefano Zampini PetscErrorCode PCBDDCScatterCoarseDataBegin(PC pc,InsertMode imode, ScatterMode smode) 5360674ae819SStefano Zampini { 
5361674ae819SStefano Zampini PetscErrorCode ierr; 5362674ae819SStefano Zampini PC_BDDC* pcbddc = (PC_BDDC*)(pc->data); 536358da7f69SStefano Zampini PetscScalar *array; 536412edc857SStefano Zampini Vec from,to; 5365674ae819SStefano Zampini 5366674ae819SStefano Zampini PetscFunctionBegin; 536712edc857SStefano Zampini if (smode == SCATTER_REVERSE) { /* from global to local -> get data from coarse solution */ 536812edc857SStefano Zampini from = pcbddc->coarse_vec; 536912edc857SStefano Zampini to = pcbddc->vec1_P; 537012edc857SStefano Zampini if (pcbddc->coarse_ksp) { /* get array from coarse processes */ 537112edc857SStefano Zampini Vec tvec; 537258da7f69SStefano Zampini 537358da7f69SStefano Zampini ierr = KSPGetRhs(pcbddc->coarse_ksp,&tvec);CHKERRQ(ierr); 537458da7f69SStefano Zampini ierr = VecResetArray(tvec);CHKERRQ(ierr); 537512edc857SStefano Zampini ierr = KSPGetSolution(pcbddc->coarse_ksp,&tvec);CHKERRQ(ierr); 537658da7f69SStefano Zampini ierr = VecGetArray(tvec,&array);CHKERRQ(ierr); 537758da7f69SStefano Zampini ierr = VecPlaceArray(from,array);CHKERRQ(ierr); 537858da7f69SStefano Zampini ierr = VecRestoreArray(tvec,&array);CHKERRQ(ierr); 537912edc857SStefano Zampini } 538012edc857SStefano Zampini } else { /* from local to global -> put data in coarse right hand side */ 538112edc857SStefano Zampini from = pcbddc->vec1_P; 538212edc857SStefano Zampini to = pcbddc->coarse_vec; 538312edc857SStefano Zampini } 538412edc857SStefano Zampini ierr = VecScatterBegin(pcbddc->coarse_loc_to_glob,from,to,imode,smode);CHKERRQ(ierr); 5385674ae819SStefano Zampini PetscFunctionReturn(0); 5386674ae819SStefano Zampini } 5387674ae819SStefano Zampini 538812edc857SStefano Zampini PetscErrorCode PCBDDCScatterCoarseDataEnd(PC pc, InsertMode imode, ScatterMode smode) 5389674ae819SStefano Zampini { 5390674ae819SStefano Zampini PetscErrorCode ierr; 5391674ae819SStefano Zampini PC_BDDC* pcbddc = (PC_BDDC*)(pc->data); 539258da7f69SStefano Zampini PetscScalar *array; 539312edc857SStefano 
Zampini Vec from,to; 5394674ae819SStefano Zampini 5395674ae819SStefano Zampini PetscFunctionBegin; 539612edc857SStefano Zampini if (smode == SCATTER_REVERSE) { /* from global to local -> get data from coarse solution */ 539712edc857SStefano Zampini from = pcbddc->coarse_vec; 539812edc857SStefano Zampini to = pcbddc->vec1_P; 539912edc857SStefano Zampini } else { /* from local to global -> put data in coarse right hand side */ 540012edc857SStefano Zampini from = pcbddc->vec1_P; 540112edc857SStefano Zampini to = pcbddc->coarse_vec; 540212edc857SStefano Zampini } 540312edc857SStefano Zampini ierr = VecScatterEnd(pcbddc->coarse_loc_to_glob,from,to,imode,smode);CHKERRQ(ierr); 540412edc857SStefano Zampini if (smode == SCATTER_FORWARD) { 540512edc857SStefano Zampini if (pcbddc->coarse_ksp) { /* get array from coarse processes */ 540612edc857SStefano Zampini Vec tvec; 540758da7f69SStefano Zampini 540812edc857SStefano Zampini ierr = KSPGetRhs(pcbddc->coarse_ksp,&tvec);CHKERRQ(ierr); 540958da7f69SStefano Zampini ierr = VecGetArray(to,&array);CHKERRQ(ierr); 541058da7f69SStefano Zampini ierr = VecPlaceArray(tvec,array);CHKERRQ(ierr); 541158da7f69SStefano Zampini ierr = VecRestoreArray(to,&array);CHKERRQ(ierr); 541258da7f69SStefano Zampini } 541358da7f69SStefano Zampini } else { 541458da7f69SStefano Zampini if (pcbddc->coarse_ksp) { /* restore array of pcbddc->coarse_vec */ 541558da7f69SStefano Zampini ierr = VecResetArray(from);CHKERRQ(ierr); 541612edc857SStefano Zampini } 541712edc857SStefano Zampini } 5418674ae819SStefano Zampini PetscFunctionReturn(0); 5419674ae819SStefano Zampini } 5420674ae819SStefano Zampini 5421984c4197SStefano Zampini /* uncomment for testing purposes */ 5422984c4197SStefano Zampini /* #define PETSC_MISSING_LAPACK_GESVD 1 */ 5423674ae819SStefano Zampini PetscErrorCode PCBDDCConstraintsSetUp(PC pc) 5424674ae819SStefano Zampini { 5425674ae819SStefano Zampini PetscErrorCode ierr; 5426674ae819SStefano Zampini PC_IS* pcis = (PC_IS*)(pc->data); 
5427674ae819SStefano Zampini PC_BDDC* pcbddc = (PC_BDDC*)pc->data; 5428674ae819SStefano Zampini Mat_IS* matis = (Mat_IS*)pc->pmat->data; 5429984c4197SStefano Zampini /* one and zero */ 5430984c4197SStefano Zampini PetscScalar one=1.0,zero=0.0; 5431984c4197SStefano Zampini /* space to store constraints and their local indices */ 54329162d606SStefano Zampini PetscScalar *constraints_data; 54339162d606SStefano Zampini PetscInt *constraints_idxs,*constraints_idxs_B; 54349162d606SStefano Zampini PetscInt *constraints_idxs_ptr,*constraints_data_ptr; 54359162d606SStefano Zampini PetscInt *constraints_n; 5436984c4197SStefano Zampini /* iterators */ 5437b3d85658SStefano Zampini PetscInt i,j,k,total_counts,total_counts_cc,cum; 5438984c4197SStefano Zampini /* BLAS integers */ 5439e310c8b4SStefano Zampini PetscBLASInt lwork,lierr; 5440e310c8b4SStefano Zampini PetscBLASInt Blas_N,Blas_M,Blas_K,Blas_one=1; 5441c4303822SStefano Zampini PetscBLASInt Blas_LDA,Blas_LDB,Blas_LDC; 5442727cdba6SStefano Zampini /* reuse */ 54430e6343abSStefano Zampini PetscInt olocal_primal_size,olocal_primal_size_cc; 54440e6343abSStefano Zampini PetscInt *olocal_primal_ref_node,*olocal_primal_ref_mult; 5445984c4197SStefano Zampini /* change of basis */ 5446b3d85658SStefano Zampini PetscBool qr_needed; 54479162d606SStefano Zampini PetscBT change_basis,qr_needed_idx; 5448984c4197SStefano Zampini /* auxiliary stuff */ 544964efe560SStefano Zampini PetscInt *nnz,*is_indices; 54508a0068c3SStefano Zampini PetscInt ncc; 5451984c4197SStefano Zampini /* some quantities */ 545245a1bb75SStefano Zampini PetscInt n_vertices,total_primal_vertices,valid_constraints; 5453a58a30b4SStefano Zampini PetscInt size_of_constraint,max_size_of_constraint=0,max_constraints,temp_constraints; 5454984c4197SStefano Zampini 5455674ae819SStefano Zampini PetscFunctionBegin; 54568e61c736SStefano Zampini /* Destroy Mat objects computed previously */ 54578e61c736SStefano Zampini ierr = 
MatDestroy(&pcbddc->ChangeOfBasisMatrix);CHKERRQ(ierr); 54588e61c736SStefano Zampini ierr = MatDestroy(&pcbddc->ConstraintMatrix);CHKERRQ(ierr); 545916909a7fSStefano Zampini ierr = MatDestroy(&pcbddc->switch_static_change);CHKERRQ(ierr); 5460088faed8SStefano Zampini /* save info on constraints from previous setup (if any) */ 5461088faed8SStefano Zampini olocal_primal_size = pcbddc->local_primal_size; 54620e6343abSStefano Zampini olocal_primal_size_cc = pcbddc->local_primal_size_cc; 54630e6343abSStefano Zampini ierr = PetscMalloc2(olocal_primal_size_cc,&olocal_primal_ref_node,olocal_primal_size_cc,&olocal_primal_ref_mult);CHKERRQ(ierr); 54640e6343abSStefano Zampini ierr = PetscMemcpy(olocal_primal_ref_node,pcbddc->local_primal_ref_node,olocal_primal_size_cc*sizeof(PetscInt));CHKERRQ(ierr); 54650e6343abSStefano Zampini ierr = PetscMemcpy(olocal_primal_ref_mult,pcbddc->local_primal_ref_mult,olocal_primal_size_cc*sizeof(PetscInt));CHKERRQ(ierr); 54660e6343abSStefano Zampini ierr = PetscFree2(pcbddc->local_primal_ref_node,pcbddc->local_primal_ref_mult);CHKERRQ(ierr); 5467088faed8SStefano Zampini ierr = PetscFree(pcbddc->primal_indices_local_idxs);CHKERRQ(ierr); 5468cf5a6209SStefano Zampini 5469cf5a6209SStefano Zampini if (!pcbddc->adaptive_selection) { 54709162d606SStefano Zampini IS ISForVertices,*ISForFaces,*ISForEdges; 5471cf5a6209SStefano Zampini MatNullSpace nearnullsp; 5472cf5a6209SStefano Zampini const Vec *nearnullvecs; 5473cf5a6209SStefano Zampini Vec *localnearnullsp; 5474cf5a6209SStefano Zampini PetscScalar *array; 5475cf5a6209SStefano Zampini PetscInt n_ISForFaces,n_ISForEdges,nnsp_size; 5476cf5a6209SStefano Zampini PetscBool nnsp_has_cnst; 5477674ae819SStefano Zampini /* LAPACK working arrays for SVD or POD */ 5478b3d85658SStefano Zampini PetscBool skip_lapack,boolforchange; 5479674ae819SStefano Zampini PetscScalar *work; 5480674ae819SStefano Zampini PetscReal *singular_vals; 5481674ae819SStefano Zampini #if defined(PETSC_USE_COMPLEX) 5482674ae819SStefano 
Zampini PetscReal *rwork; 5483674ae819SStefano Zampini #endif 5484674ae819SStefano Zampini #if defined(PETSC_MISSING_LAPACK_GESVD) 5485674ae819SStefano Zampini PetscScalar *temp_basis,*correlation_mat; 5486674ae819SStefano Zampini #else 5487964fefecSStefano Zampini PetscBLASInt dummy_int=1; 5488964fefecSStefano Zampini PetscScalar dummy_scalar=1.; 5489674ae819SStefano Zampini #endif 5490674ae819SStefano Zampini 5491674ae819SStefano Zampini /* Get index sets for faces, edges and vertices from graph */ 5492d06fc5fdSStefano Zampini ierr = PCBDDCGraphGetCandidatesIS(pcbddc->mat_graph,&n_ISForFaces,&ISForFaces,&n_ISForEdges,&ISForEdges,&ISForVertices);CHKERRQ(ierr); 5493e4d548c7SStefano Zampini /* print some info */ 54945c643e28SStefano Zampini if (pcbddc->dbg_flag && (!pcbddc->sub_schurs || pcbddc->sub_schurs_rebuild)) { 5495e4d548c7SStefano Zampini PetscInt nv; 5496e4d548c7SStefano Zampini 5497c8272957SStefano Zampini ierr = PCBDDCGraphASCIIView(pcbddc->mat_graph,pcbddc->dbg_flag,pcbddc->dbg_viewer);CHKERRQ(ierr); 5498e4d548c7SStefano Zampini ierr = ISGetSize(ISForVertices,&nv);CHKERRQ(ierr); 5499e4d548c7SStefano Zampini ierr = PetscViewerASCIIPushSynchronized(pcbddc->dbg_viewer);CHKERRQ(ierr); 5500e4d548c7SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"--------------------------------------------------------------\n");CHKERRQ(ierr); 5501e4d548c7SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"Subdomain %04d got %02d local candidate vertices (%d)\n",PetscGlobalRank,nv,pcbddc->use_vertices);CHKERRQ(ierr); 5502e4d548c7SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"Subdomain %04d got %02d local candidate edges (%d)\n",PetscGlobalRank,n_ISForEdges,pcbddc->use_edges);CHKERRQ(ierr); 5503e4d548c7SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"Subdomain %04d got %02d local candidate faces 
(%d)\n",PetscGlobalRank,n_ISForFaces,pcbddc->use_faces);CHKERRQ(ierr); 5504e4d548c7SStefano Zampini ierr = PetscViewerFlush(pcbddc->dbg_viewer);CHKERRQ(ierr); 5505e4d548c7SStefano Zampini ierr = PetscViewerASCIIPopSynchronized(pcbddc->dbg_viewer);CHKERRQ(ierr); 5506e4d548c7SStefano Zampini } 5507e4d548c7SStefano Zampini 5508d06fc5fdSStefano Zampini /* free unneeded index sets */ 5509d06fc5fdSStefano Zampini if (!pcbddc->use_vertices) { 5510d06fc5fdSStefano Zampini ierr = ISDestroy(&ISForVertices);CHKERRQ(ierr); 5511674ae819SStefano Zampini } 5512d06fc5fdSStefano Zampini if (!pcbddc->use_edges) { 5513d06fc5fdSStefano Zampini for (i=0;i<n_ISForEdges;i++) { 5514d06fc5fdSStefano Zampini ierr = ISDestroy(&ISForEdges[i]);CHKERRQ(ierr); 5515d06fc5fdSStefano Zampini } 5516d06fc5fdSStefano Zampini ierr = PetscFree(ISForEdges);CHKERRQ(ierr); 5517d06fc5fdSStefano Zampini n_ISForEdges = 0; 5518d06fc5fdSStefano Zampini } 5519d06fc5fdSStefano Zampini if (!pcbddc->use_faces) { 5520d06fc5fdSStefano Zampini for (i=0;i<n_ISForFaces;i++) { 5521d06fc5fdSStefano Zampini ierr = ISDestroy(&ISForFaces[i]);CHKERRQ(ierr); 5522d06fc5fdSStefano Zampini } 5523d06fc5fdSStefano Zampini ierr = PetscFree(ISForFaces);CHKERRQ(ierr); 5524d06fc5fdSStefano Zampini n_ISForFaces = 0; 5525d06fc5fdSStefano Zampini } 552670022509SStefano Zampini 5527674ae819SStefano Zampini /* check if near null space is attached to global mat */ 5528674ae819SStefano Zampini ierr = MatGetNearNullSpace(pc->pmat,&nearnullsp);CHKERRQ(ierr); 5529674ae819SStefano Zampini if (nearnullsp) { 5530674ae819SStefano Zampini ierr = MatNullSpaceGetVecs(nearnullsp,&nnsp_has_cnst,&nnsp_size,&nearnullvecs);CHKERRQ(ierr); 5531f4ddd8eeSStefano Zampini /* remove any stored info */ 5532f4ddd8eeSStefano Zampini ierr = MatNullSpaceDestroy(&pcbddc->onearnullspace);CHKERRQ(ierr); 5533f4ddd8eeSStefano Zampini ierr = PetscFree(pcbddc->onearnullvecs_state);CHKERRQ(ierr); 5534f4ddd8eeSStefano Zampini /* store information for BDDC solver reuse */ 
5535f4ddd8eeSStefano Zampini ierr = PetscObjectReference((PetscObject)nearnullsp);CHKERRQ(ierr); 5536f4ddd8eeSStefano Zampini pcbddc->onearnullspace = nearnullsp; 5537473ba861SJed Brown ierr = PetscMalloc1(nnsp_size,&pcbddc->onearnullvecs_state);CHKERRQ(ierr); 5538f4ddd8eeSStefano Zampini for (i=0;i<nnsp_size;i++) { 5539f4ddd8eeSStefano Zampini ierr = PetscObjectStateGet((PetscObject)nearnullvecs[i],&pcbddc->onearnullvecs_state[i]);CHKERRQ(ierr); 5540f4ddd8eeSStefano Zampini } 5541984c4197SStefano Zampini } else { /* if near null space is not provided BDDC uses constants by default */ 5542984c4197SStefano Zampini nnsp_size = 0; 5543674ae819SStefano Zampini nnsp_has_cnst = PETSC_TRUE; 5544674ae819SStefano Zampini } 5545984c4197SStefano Zampini /* get max number of constraints on a single cc */ 5546984c4197SStefano Zampini max_constraints = nnsp_size; 5547984c4197SStefano Zampini if (nnsp_has_cnst) max_constraints++; 5548984c4197SStefano Zampini 5549674ae819SStefano Zampini /* 5550674ae819SStefano Zampini Evaluate maximum storage size needed by the procedure 55519162d606SStefano Zampini - Indices for connected component i stored at "constraints_idxs + constraints_idxs_ptr[i]" 55529162d606SStefano Zampini - Values for constraints on connected component i stored at "constraints_data + constraints_data_ptr[i]" 55539162d606SStefano Zampini There can be multiple constraints per connected component 5554674ae819SStefano Zampini */ 5555674ae819SStefano Zampini n_vertices = 0; 5556674ae819SStefano Zampini if (ISForVertices) { 5557674ae819SStefano Zampini ierr = ISGetSize(ISForVertices,&n_vertices);CHKERRQ(ierr); 5558674ae819SStefano Zampini } 55599162d606SStefano Zampini ncc = n_vertices+n_ISForFaces+n_ISForEdges; 55609162d606SStefano Zampini ierr = PetscMalloc3(ncc+1,&constraints_idxs_ptr,ncc+1,&constraints_data_ptr,ncc,&constraints_n);CHKERRQ(ierr); 55619162d606SStefano Zampini 55629162d606SStefano Zampini total_counts = n_ISForFaces+n_ISForEdges; 55639162d606SStefano 
Zampini total_counts *= max_constraints; 5564674ae819SStefano Zampini total_counts += n_vertices; 55654641a718SStefano Zampini ierr = PetscBTCreate(total_counts,&change_basis);CHKERRQ(ierr); 55669162d606SStefano Zampini 5567674ae819SStefano Zampini total_counts = 0; 5568674ae819SStefano Zampini max_size_of_constraint = 0; 5569674ae819SStefano Zampini for (i=0;i<n_ISForEdges+n_ISForFaces;i++) { 55709162d606SStefano Zampini IS used_is; 5571674ae819SStefano Zampini if (i<n_ISForEdges) { 55729162d606SStefano Zampini used_is = ISForEdges[i]; 5573674ae819SStefano Zampini } else { 55749162d606SStefano Zampini used_is = ISForFaces[i-n_ISForEdges]; 5575674ae819SStefano Zampini } 55769162d606SStefano Zampini ierr = ISGetSize(used_is,&j);CHKERRQ(ierr); 5577674ae819SStefano Zampini total_counts += j; 5578674ae819SStefano Zampini max_size_of_constraint = PetscMax(j,max_size_of_constraint); 5579674ae819SStefano Zampini } 55809162d606SStefano Zampini ierr = PetscMalloc3(total_counts*max_constraints+n_vertices,&constraints_data,total_counts+n_vertices,&constraints_idxs,total_counts+n_vertices,&constraints_idxs_B);CHKERRQ(ierr); 55819162d606SStefano Zampini 5582984c4197SStefano Zampini /* get local part of global near null space vectors */ 5583785e854fSJed Brown ierr = PetscMalloc1(nnsp_size,&localnearnullsp);CHKERRQ(ierr); 5584984c4197SStefano Zampini for (k=0;k<nnsp_size;k++) { 5585984c4197SStefano Zampini ierr = VecDuplicate(pcis->vec1_N,&localnearnullsp[k]);CHKERRQ(ierr); 5586e176bc59SStefano Zampini ierr = VecScatterBegin(matis->rctx,nearnullvecs[k],localnearnullsp[k],INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 5587e176bc59SStefano Zampini ierr = VecScatterEnd(matis->rctx,nearnullvecs[k],localnearnullsp[k],INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 5588984c4197SStefano Zampini } 5589674ae819SStefano Zampini 5590242a89d7SStefano Zampini /* whether or not to skip lapack calls */ 5591242a89d7SStefano Zampini skip_lapack = PETSC_TRUE; 5592a773dcb8SStefano Zampini if 
(n_ISForFaces+n_ISForEdges && max_constraints > 1 && !pcbddc->use_nnsp_true) skip_lapack = PETSC_FALSE; 5593242a89d7SStefano Zampini 5594984c4197SStefano Zampini /* First we issue queries to allocate optimal workspace for LAPACKgesvd (or LAPACKsyev if SVD is missing) */ 5595a773dcb8SStefano Zampini if (!skip_lapack) { 5596674ae819SStefano Zampini PetscScalar temp_work; 5597911cabfeSStefano Zampini 5598674ae819SStefano Zampini #if defined(PETSC_MISSING_LAPACK_GESVD) 5599984c4197SStefano Zampini /* Proper Orthogonal Decomposition (POD) using the snapshot method */ 5600785e854fSJed Brown ierr = PetscMalloc1(max_constraints*max_constraints,&correlation_mat);CHKERRQ(ierr); 5601785e854fSJed Brown ierr = PetscMalloc1(max_constraints,&singular_vals);CHKERRQ(ierr); 5602785e854fSJed Brown ierr = PetscMalloc1(max_size_of_constraint*max_constraints,&temp_basis);CHKERRQ(ierr); 5603674ae819SStefano Zampini #if defined(PETSC_USE_COMPLEX) 5604785e854fSJed Brown ierr = PetscMalloc1(3*max_constraints,&rwork);CHKERRQ(ierr); 5605674ae819SStefano Zampini #endif 5606674ae819SStefano Zampini /* now we evaluate the optimal workspace using query with lwork=-1 */ 5607c8244a33SStefano Zampini ierr = PetscBLASIntCast(max_constraints,&Blas_N);CHKERRQ(ierr); 5608c8244a33SStefano Zampini ierr = PetscBLASIntCast(max_constraints,&Blas_LDA);CHKERRQ(ierr); 5609674ae819SStefano Zampini lwork = -1; 5610674ae819SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 5611674ae819SStefano Zampini #if !defined(PETSC_USE_COMPLEX) 5612c8244a33SStefano Zampini PetscStackCallBLAS("LAPACKsyev",LAPACKsyev_("V","U",&Blas_N,correlation_mat,&Blas_LDA,singular_vals,&temp_work,&lwork,&lierr)); 5613674ae819SStefano Zampini #else 5614c8244a33SStefano Zampini PetscStackCallBLAS("LAPACKsyev",LAPACKsyev_("V","U",&Blas_N,correlation_mat,&Blas_LDA,singular_vals,&temp_work,&lwork,rwork,&lierr)); 5615674ae819SStefano Zampini #endif 5616674ae819SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 
5617984c4197SStefano Zampini if (lierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in query to SYEV Lapack routine %d",(int)lierr); 5618674ae819SStefano Zampini #else /* on missing GESVD */ 5619674ae819SStefano Zampini /* SVD */ 5620674ae819SStefano Zampini PetscInt max_n,min_n; 5621674ae819SStefano Zampini max_n = max_size_of_constraint; 5622984c4197SStefano Zampini min_n = max_constraints; 5623984c4197SStefano Zampini if (max_size_of_constraint < max_constraints) { 5624674ae819SStefano Zampini min_n = max_size_of_constraint; 5625984c4197SStefano Zampini max_n = max_constraints; 5626674ae819SStefano Zampini } 5627785e854fSJed Brown ierr = PetscMalloc1(min_n,&singular_vals);CHKERRQ(ierr); 5628674ae819SStefano Zampini #if defined(PETSC_USE_COMPLEX) 5629785e854fSJed Brown ierr = PetscMalloc1(5*min_n,&rwork);CHKERRQ(ierr); 5630674ae819SStefano Zampini #endif 5631674ae819SStefano Zampini /* now we evaluate the optimal workspace using query with lwork=-1 */ 5632674ae819SStefano Zampini lwork = -1; 5633e310c8b4SStefano Zampini ierr = PetscBLASIntCast(max_n,&Blas_M);CHKERRQ(ierr); 5634e310c8b4SStefano Zampini ierr = PetscBLASIntCast(min_n,&Blas_N);CHKERRQ(ierr); 5635b7d8b9f8SStefano Zampini ierr = PetscBLASIntCast(max_n,&Blas_LDA);CHKERRQ(ierr); 5636674ae819SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 5637674ae819SStefano Zampini #if !defined(PETSC_USE_COMPLEX) 56389162d606SStefano Zampini PetscStackCallBLAS("LAPACKgesvd",LAPACKgesvd_("O","N",&Blas_M,&Blas_N,&constraints_data[0],&Blas_LDA,singular_vals,&dummy_scalar,&dummy_int,&dummy_scalar,&dummy_int,&temp_work,&lwork,&lierr)); 5639674ae819SStefano Zampini #else 56409162d606SStefano Zampini PetscStackCallBLAS("LAPACKgesvd",LAPACKgesvd_("O","N",&Blas_M,&Blas_N,&constraints_data[0],&Blas_LDA,singular_vals,&dummy_scalar,&dummy_int,&dummy_scalar,&dummy_int,&temp_work,&lwork,rwork,&lierr)); 5641674ae819SStefano Zampini #endif 5642674ae819SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 
5643984c4197SStefano Zampini if (lierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in query to GESVD Lapack routine %d",(int)lierr); 5644984c4197SStefano Zampini #endif /* on missing GESVD */ 5645674ae819SStefano Zampini /* Allocate optimal workspace */ 5646674ae819SStefano Zampini ierr = PetscBLASIntCast((PetscInt)PetscRealPart(temp_work),&lwork);CHKERRQ(ierr); 5647854ce69bSBarry Smith ierr = PetscMalloc1(lwork,&work);CHKERRQ(ierr); 5648674ae819SStefano Zampini } 5649674ae819SStefano Zampini /* Now we can loop on constraining sets */ 5650674ae819SStefano Zampini total_counts = 0; 56519162d606SStefano Zampini constraints_idxs_ptr[0] = 0; 56529162d606SStefano Zampini constraints_data_ptr[0] = 0; 5653674ae819SStefano Zampini /* vertices */ 56549162d606SStefano Zampini if (n_vertices) { 5655674ae819SStefano Zampini ierr = ISGetIndices(ISForVertices,(const PetscInt**)&is_indices);CHKERRQ(ierr); 56569162d606SStefano Zampini ierr = PetscMemcpy(constraints_idxs,is_indices,n_vertices*sizeof(PetscInt));CHKERRQ(ierr); 5657674ae819SStefano Zampini for (i=0;i<n_vertices;i++) { 56589162d606SStefano Zampini constraints_n[total_counts] = 1; 56599162d606SStefano Zampini constraints_data[total_counts] = 1.0; 56609162d606SStefano Zampini constraints_idxs_ptr[total_counts+1] = constraints_idxs_ptr[total_counts]+1; 56619162d606SStefano Zampini constraints_data_ptr[total_counts+1] = constraints_data_ptr[total_counts]+1; 5662674ae819SStefano Zampini total_counts++; 5663674ae819SStefano Zampini } 5664674ae819SStefano Zampini ierr = ISRestoreIndices(ISForVertices,(const PetscInt**)&is_indices);CHKERRQ(ierr); 5665674ae819SStefano Zampini n_vertices = total_counts; 5666674ae819SStefano Zampini } 5667984c4197SStefano Zampini 5668674ae819SStefano Zampini /* edges and faces */ 56699162d606SStefano Zampini total_counts_cc = total_counts; 5670911cabfeSStefano Zampini for (ncc=0;ncc<n_ISForEdges+n_ISForFaces;ncc++) { 56719162d606SStefano Zampini IS used_is; 56729162d606SStefano Zampini 
PetscBool idxs_copied = PETSC_FALSE; 56739162d606SStefano Zampini 5674911cabfeSStefano Zampini if (ncc<n_ISForEdges) { 56759162d606SStefano Zampini used_is = ISForEdges[ncc]; 5676984c4197SStefano Zampini boolforchange = pcbddc->use_change_of_basis; /* change or not the basis on the edge */ 5677674ae819SStefano Zampini } else { 56789162d606SStefano Zampini used_is = ISForFaces[ncc-n_ISForEdges]; 5679984c4197SStefano Zampini boolforchange = (PetscBool)(pcbddc->use_change_of_basis && pcbddc->use_change_on_faces); /* change or not the basis on the face */ 5680674ae819SStefano Zampini } 5681674ae819SStefano Zampini temp_constraints = 0; /* zero the number of constraints I have on this conn comp */ 56829162d606SStefano Zampini 56839162d606SStefano Zampini ierr = ISGetSize(used_is,&size_of_constraint);CHKERRQ(ierr); 56849162d606SStefano Zampini ierr = ISGetIndices(used_is,(const PetscInt**)&is_indices);CHKERRQ(ierr); 5685984c4197SStefano Zampini /* change of basis should not be performed on local periodic nodes */ 5686984c4197SStefano Zampini if (pcbddc->mat_graph->mirrors && pcbddc->mat_graph->mirrors[is_indices[0]]) boolforchange = PETSC_FALSE; 5687674ae819SStefano Zampini if (nnsp_has_cnst) { 56885b08dc53SStefano Zampini PetscScalar quad_value; 56899162d606SStefano Zampini 56909162d606SStefano Zampini ierr = PetscMemcpy(constraints_idxs + constraints_idxs_ptr[total_counts_cc],is_indices,size_of_constraint*sizeof(PetscInt));CHKERRQ(ierr); 56919162d606SStefano Zampini idxs_copied = PETSC_TRUE; 56929162d606SStefano Zampini 5693a773dcb8SStefano Zampini if (!pcbddc->use_nnsp_true) { 5694674ae819SStefano Zampini quad_value = (PetscScalar)(1.0/PetscSqrtReal((PetscReal)size_of_constraint)); 5695a773dcb8SStefano Zampini } else { 5696a773dcb8SStefano Zampini quad_value = 1.0; 5697a773dcb8SStefano Zampini } 5698674ae819SStefano Zampini for (j=0;j<size_of_constraint;j++) { 56999162d606SStefano Zampini constraints_data[constraints_data_ptr[total_counts_cc]+j] = quad_value; 
5700674ae819SStefano Zampini } 57019162d606SStefano Zampini temp_constraints++; 5702674ae819SStefano Zampini total_counts++; 5703674ae819SStefano Zampini } 5704674ae819SStefano Zampini for (k=0;k<nnsp_size;k++) { 5705984c4197SStefano Zampini PetscReal real_value; 57069162d606SStefano Zampini PetscScalar *ptr_to_data; 57079162d606SStefano Zampini 5708984c4197SStefano Zampini ierr = VecGetArrayRead(localnearnullsp[k],(const PetscScalar**)&array);CHKERRQ(ierr); 57099162d606SStefano Zampini ptr_to_data = &constraints_data[constraints_data_ptr[total_counts_cc]+temp_constraints*size_of_constraint]; 5710674ae819SStefano Zampini for (j=0;j<size_of_constraint;j++) { 57119162d606SStefano Zampini ptr_to_data[j] = array[is_indices[j]]; 5712674ae819SStefano Zampini } 5713984c4197SStefano Zampini ierr = VecRestoreArrayRead(localnearnullsp[k],(const PetscScalar**)&array);CHKERRQ(ierr); 5714984c4197SStefano Zampini /* check if array is null on the connected component */ 5715e310c8b4SStefano Zampini ierr = PetscBLASIntCast(size_of_constraint,&Blas_N);CHKERRQ(ierr); 57169162d606SStefano Zampini PetscStackCallBLAS("BLASasum",real_value = BLASasum_(&Blas_N,ptr_to_data,&Blas_one)); 57175b08dc53SStefano Zampini if (real_value > 0.0) { /* keep indices and values */ 5718674ae819SStefano Zampini temp_constraints++; 5719674ae819SStefano Zampini total_counts++; 57209162d606SStefano Zampini if (!idxs_copied) { 57219162d606SStefano Zampini ierr = PetscMemcpy(constraints_idxs + constraints_idxs_ptr[total_counts_cc],is_indices,size_of_constraint*sizeof(PetscInt));CHKERRQ(ierr); 57229162d606SStefano Zampini idxs_copied = PETSC_TRUE; 5723674ae819SStefano Zampini } 5724674ae819SStefano Zampini } 57259162d606SStefano Zampini } 57269162d606SStefano Zampini ierr = ISRestoreIndices(used_is,(const PetscInt**)&is_indices);CHKERRQ(ierr); 572745a1bb75SStefano Zampini valid_constraints = temp_constraints; 5728eb97c9d2SStefano Zampini if (!pcbddc->use_nnsp_true && temp_constraints) { 5729a773dcb8SStefano 
Zampini if (temp_constraints == 1) { /* just normalize the constraint */ 57309162d606SStefano Zampini PetscScalar norm,*ptr_to_data; 57319162d606SStefano Zampini 57329162d606SStefano Zampini ptr_to_data = &constraints_data[constraints_data_ptr[total_counts_cc]]; 5733a773dcb8SStefano Zampini ierr = PetscBLASIntCast(size_of_constraint,&Blas_N);CHKERRQ(ierr); 57349162d606SStefano Zampini PetscStackCallBLAS("BLASdot",norm = BLASdot_(&Blas_N,ptr_to_data,&Blas_one,ptr_to_data,&Blas_one)); 5735a773dcb8SStefano Zampini norm = 1.0/PetscSqrtReal(PetscRealPart(norm)); 57369162d606SStefano Zampini PetscStackCallBLAS("BLASscal",BLASscal_(&Blas_N,&norm,ptr_to_data,&Blas_one)); 5737a773dcb8SStefano Zampini } else { /* perform SVD */ 5738984c4197SStefano Zampini PetscReal tol = 1.0e-8; /* tolerance for retaining eigenmodes */ 57399162d606SStefano Zampini PetscScalar *ptr_to_data = &constraints_data[constraints_data_ptr[total_counts_cc]]; 5740674ae819SStefano Zampini 5741674ae819SStefano Zampini #if defined(PETSC_MISSING_LAPACK_GESVD) 5742984c4197SStefano Zampini /* SVD: Y = U*S*V^H -> U (eigenvectors of Y*Y^H) = Y*V*(S)^\dag 5743984c4197SStefano Zampini POD: Y^H*Y = V*D*V^H, D = S^H*S -> U = Y*V*D^(-1/2) 5744984c4197SStefano Zampini -> When PETSC_USE_COMPLEX and PETSC_MISSING_LAPACK_GESVD are defined 5745984c4197SStefano Zampini the constraints basis will differ (by a complex factor with absolute value equal to 1) 5746984c4197SStefano Zampini from that computed using LAPACKgesvd 5747984c4197SStefano Zampini -> This is due to a different computation of eigenvectors in LAPACKheev 5748984c4197SStefano Zampini -> The quality of the POD-computed basis will be the same */ 5749984c4197SStefano Zampini ierr = PetscMemzero(correlation_mat,temp_constraints*temp_constraints*sizeof(PetscScalar));CHKERRQ(ierr); 5750674ae819SStefano Zampini /* Store upper triangular part of correlation matrix */ 5751e310c8b4SStefano Zampini ierr = PetscBLASIntCast(size_of_constraint,&Blas_N);CHKERRQ(ierr); 
5752984c4197SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 5753674ae819SStefano Zampini for (j=0;j<temp_constraints;j++) { 5754674ae819SStefano Zampini for (k=0;k<j+1;k++) { 57559162d606SStefano Zampini PetscStackCallBLAS("BLASdot",correlation_mat[j*temp_constraints+k] = BLASdot_(&Blas_N,ptr_to_data+k*size_of_constraint,&Blas_one,ptr_to_data+j*size_of_constraint,&Blas_one)); 5756674ae819SStefano Zampini } 5757674ae819SStefano Zampini } 5758e310c8b4SStefano Zampini /* compute eigenvalues and eigenvectors of correlation matrix */ 5759e310c8b4SStefano Zampini ierr = PetscBLASIntCast(temp_constraints,&Blas_N);CHKERRQ(ierr); 5760e310c8b4SStefano Zampini ierr = PetscBLASIntCast(temp_constraints,&Blas_LDA);CHKERRQ(ierr); 5761674ae819SStefano Zampini #if !defined(PETSC_USE_COMPLEX) 5762c8244a33SStefano Zampini PetscStackCallBLAS("LAPACKsyev",LAPACKsyev_("V","U",&Blas_N,correlation_mat,&Blas_LDA,singular_vals,work,&lwork,&lierr)); 5763674ae819SStefano Zampini #else 5764c8244a33SStefano Zampini PetscStackCallBLAS("LAPACKsyev",LAPACKsyev_("V","U",&Blas_N,correlation_mat,&Blas_LDA,singular_vals,work,&lwork,rwork,&lierr)); 5765674ae819SStefano Zampini #endif 5766674ae819SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 5767984c4197SStefano Zampini if (lierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in SYEV Lapack routine %d",(int)lierr); 5768984c4197SStefano Zampini /* retain eigenvalues greater than tol: note that LAPACKsyev gives eigs in ascending order */ 5769674ae819SStefano Zampini j = 0; 5770984c4197SStefano Zampini while (j < temp_constraints && singular_vals[j] < tol) j++; 5771674ae819SStefano Zampini total_counts = total_counts-j; 577245a1bb75SStefano Zampini valid_constraints = temp_constraints-j; 5773e310c8b4SStefano Zampini /* scale and copy POD basis into used quadrature memory */ 5774c4303822SStefano Zampini ierr = PetscBLASIntCast(size_of_constraint,&Blas_M);CHKERRQ(ierr); 5775c4303822SStefano Zampini ierr = 
PetscBLASIntCast(temp_constraints,&Blas_N);CHKERRQ(ierr); 5776c4303822SStefano Zampini ierr = PetscBLASIntCast(temp_constraints,&Blas_K);CHKERRQ(ierr); 5777c4303822SStefano Zampini ierr = PetscBLASIntCast(size_of_constraint,&Blas_LDA);CHKERRQ(ierr); 5778c4303822SStefano Zampini ierr = PetscBLASIntCast(temp_constraints,&Blas_LDB);CHKERRQ(ierr); 5779c4303822SStefano Zampini ierr = PetscBLASIntCast(size_of_constraint,&Blas_LDC);CHKERRQ(ierr); 5780674ae819SStefano Zampini if (j<temp_constraints) { 5781984c4197SStefano Zampini PetscInt ii; 5782984c4197SStefano Zampini for (k=j;k<temp_constraints;k++) singular_vals[k] = 1.0/PetscSqrtReal(singular_vals[k]); 5783674ae819SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 57849162d606SStefano Zampini PetscStackCallBLAS("BLASgemm",BLASgemm_("N","N",&Blas_M,&Blas_N,&Blas_K,&one,ptr_to_data,&Blas_LDA,correlation_mat,&Blas_LDB,&zero,temp_basis,&Blas_LDC)); 5785674ae819SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 5786984c4197SStefano Zampini for (k=0;k<temp_constraints-j;k++) { 5787674ae819SStefano Zampini for (ii=0;ii<size_of_constraint;ii++) { 57889162d606SStefano Zampini ptr_to_data[k*size_of_constraint+ii] = singular_vals[temp_constraints-1-k]*temp_basis[(temp_constraints-1-k)*size_of_constraint+ii]; 5789674ae819SStefano Zampini } 5790674ae819SStefano Zampini } 5791674ae819SStefano Zampini } 5792674ae819SStefano Zampini #else /* on missing GESVD */ 5793e310c8b4SStefano Zampini ierr = PetscBLASIntCast(size_of_constraint,&Blas_M);CHKERRQ(ierr); 5794e310c8b4SStefano Zampini ierr = PetscBLASIntCast(temp_constraints,&Blas_N);CHKERRQ(ierr); 5795b7d8b9f8SStefano Zampini ierr = PetscBLASIntCast(size_of_constraint,&Blas_LDA);CHKERRQ(ierr); 5796674ae819SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 5797674ae819SStefano Zampini #if !defined(PETSC_USE_COMPLEX) 57989162d606SStefano Zampini 
PetscStackCallBLAS("LAPACKgesvd",LAPACKgesvd_("O","N",&Blas_M,&Blas_N,ptr_to_data,&Blas_LDA,singular_vals,&dummy_scalar,&dummy_int,&dummy_scalar,&dummy_int,work,&lwork,&lierr)); 5799674ae819SStefano Zampini #else 58009162d606SStefano Zampini PetscStackCallBLAS("LAPACKgesvd",LAPACKgesvd_("O","N",&Blas_M,&Blas_N,ptr_to_data,&Blas_LDA,singular_vals,&dummy_scalar,&dummy_int,&dummy_scalar,&dummy_int,work,&lwork,rwork,&lierr)); 5801674ae819SStefano Zampini #endif 5802984c4197SStefano Zampini if (lierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in GESVD Lapack routine %d",(int)lierr); 5803674ae819SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 5804984c4197SStefano Zampini /* retain eigenvalues greater than tol: note that LAPACKgesvd gives eigs in descending order */ 5805e310c8b4SStefano Zampini k = temp_constraints; 5806e310c8b4SStefano Zampini if (k > size_of_constraint) k = size_of_constraint; 5807674ae819SStefano Zampini j = 0; 5808e310c8b4SStefano Zampini while (j < k && singular_vals[k-j-1] < tol) j++; 580945a1bb75SStefano Zampini valid_constraints = k-j; 5810911cabfeSStefano Zampini total_counts = total_counts-temp_constraints+valid_constraints; 5811984c4197SStefano Zampini #endif /* on missing GESVD */ 5812674ae819SStefano Zampini } 5813a773dcb8SStefano Zampini } 58149162d606SStefano Zampini /* update pointers information */ 58159162d606SStefano Zampini if (valid_constraints) { 58169162d606SStefano Zampini constraints_n[total_counts_cc] = valid_constraints; 58179162d606SStefano Zampini constraints_idxs_ptr[total_counts_cc+1] = constraints_idxs_ptr[total_counts_cc]+size_of_constraint; 58189162d606SStefano Zampini constraints_data_ptr[total_counts_cc+1] = constraints_data_ptr[total_counts_cc]+size_of_constraint*valid_constraints; 58199162d606SStefano Zampini /* set change_of_basis flag */ 582045a1bb75SStefano Zampini if (boolforchange) { 5821b3d85658SStefano Zampini PetscBTSet(change_basis,total_counts_cc); 58229162d606SStefano Zampini } 
5823b3d85658SStefano Zampini total_counts_cc++; 582445a1bb75SStefano Zampini } 582545a1bb75SStefano Zampini } 5826984c4197SStefano Zampini /* free workspace */ 58278f1c130eSStefano Zampini if (!skip_lapack) { 5828984c4197SStefano Zampini ierr = PetscFree(work);CHKERRQ(ierr); 5829984c4197SStefano Zampini #if defined(PETSC_USE_COMPLEX) 5830984c4197SStefano Zampini ierr = PetscFree(rwork);CHKERRQ(ierr); 5831984c4197SStefano Zampini #endif 5832984c4197SStefano Zampini ierr = PetscFree(singular_vals);CHKERRQ(ierr); 5833984c4197SStefano Zampini #if defined(PETSC_MISSING_LAPACK_GESVD) 5834984c4197SStefano Zampini ierr = PetscFree(correlation_mat);CHKERRQ(ierr); 5835984c4197SStefano Zampini ierr = PetscFree(temp_basis);CHKERRQ(ierr); 5836984c4197SStefano Zampini #endif 5837984c4197SStefano Zampini } 5838984c4197SStefano Zampini for (k=0;k<nnsp_size;k++) { 5839984c4197SStefano Zampini ierr = VecDestroy(&localnearnullsp[k]);CHKERRQ(ierr); 5840984c4197SStefano Zampini } 5841984c4197SStefano Zampini ierr = PetscFree(localnearnullsp);CHKERRQ(ierr); 5842cf5a6209SStefano Zampini /* free index sets of faces, edges and vertices */ 5843cf5a6209SStefano Zampini for (i=0;i<n_ISForFaces;i++) { 5844cf5a6209SStefano Zampini ierr = ISDestroy(&ISForFaces[i]);CHKERRQ(ierr); 5845cf5a6209SStefano Zampini } 5846cf5a6209SStefano Zampini if (n_ISForFaces) { 5847cf5a6209SStefano Zampini ierr = PetscFree(ISForFaces);CHKERRQ(ierr); 5848cf5a6209SStefano Zampini } 5849cf5a6209SStefano Zampini for (i=0;i<n_ISForEdges;i++) { 5850cf5a6209SStefano Zampini ierr = ISDestroy(&ISForEdges[i]);CHKERRQ(ierr); 5851cf5a6209SStefano Zampini } 5852cf5a6209SStefano Zampini if (n_ISForEdges) { 5853cf5a6209SStefano Zampini ierr = PetscFree(ISForEdges);CHKERRQ(ierr); 5854cf5a6209SStefano Zampini } 5855cf5a6209SStefano Zampini ierr = ISDestroy(&ISForVertices);CHKERRQ(ierr); 585608122e43SStefano Zampini } else { 585708122e43SStefano Zampini PCBDDCSubSchurs sub_schurs = pcbddc->sub_schurs; 5858984c4197SStefano Zampini 
585908122e43SStefano Zampini total_counts = 0; 586008122e43SStefano Zampini n_vertices = 0; 5861d62866d3SStefano Zampini if (sub_schurs->is_vertices && pcbddc->use_vertices) { 5862d62866d3SStefano Zampini ierr = ISGetLocalSize(sub_schurs->is_vertices,&n_vertices);CHKERRQ(ierr); 586308122e43SStefano Zampini } 586408122e43SStefano Zampini max_constraints = 0; 58659162d606SStefano Zampini total_counts_cc = 0; 586608122e43SStefano Zampini for (i=0;i<sub_schurs->n_subs+n_vertices;i++) { 586708122e43SStefano Zampini total_counts += pcbddc->adaptive_constraints_n[i]; 58689162d606SStefano Zampini if (pcbddc->adaptive_constraints_n[i]) total_counts_cc++; 586908122e43SStefano Zampini max_constraints = PetscMax(max_constraints,pcbddc->adaptive_constraints_n[i]); 587008122e43SStefano Zampini } 58719162d606SStefano Zampini constraints_idxs_ptr = pcbddc->adaptive_constraints_idxs_ptr; 58729162d606SStefano Zampini constraints_data_ptr = pcbddc->adaptive_constraints_data_ptr; 58739162d606SStefano Zampini constraints_idxs = pcbddc->adaptive_constraints_idxs; 58749162d606SStefano Zampini constraints_data = pcbddc->adaptive_constraints_data; 587574d5cdf7SStefano Zampini /* constraints_n differs from pcbddc->adaptive_constraints_n */ 58769162d606SStefano Zampini ierr = PetscMalloc1(total_counts_cc,&constraints_n);CHKERRQ(ierr); 58779162d606SStefano Zampini total_counts_cc = 0; 58789162d606SStefano Zampini for (i=0;i<sub_schurs->n_subs+n_vertices;i++) { 58799162d606SStefano Zampini if (pcbddc->adaptive_constraints_n[i]) { 58809162d606SStefano Zampini constraints_n[total_counts_cc++] = pcbddc->adaptive_constraints_n[i]; 588108122e43SStefano Zampini } 588208122e43SStefano Zampini } 58839162d606SStefano Zampini #if 0 58849162d606SStefano Zampini printf("Found %d totals (%d)\n",total_counts_cc,total_counts); 58859162d606SStefano Zampini for (i=0;i<total_counts_cc;i++) { 58869162d606SStefano Zampini printf("const %d, start %d",i,constraints_idxs_ptr[i]); 58879162d606SStefano Zampini 
printf(" end %d:\n",constraints_idxs_ptr[i+1]); 58889162d606SStefano Zampini for (j=constraints_idxs_ptr[i];j<constraints_idxs_ptr[i+1];j++) { 58899162d606SStefano Zampini printf(" %d",constraints_idxs[j]); 58909162d606SStefano Zampini } 58919162d606SStefano Zampini printf("\n"); 58929162d606SStefano Zampini printf("number of cc: %d\n",constraints_n[i]); 58939162d606SStefano Zampini } 58941b968477SStefano Zampini for (i=0;i<n_vertices;i++) { 58958bec7fa6SStefano Zampini PetscPrintf(PETSC_COMM_SELF,"[%d] vertex %d, n %d\n",PetscGlobalRank,i,pcbddc->adaptive_constraints_n[i]); 58961b968477SStefano Zampini } 58971b968477SStefano Zampini for (i=0;i<sub_schurs->n_subs;i++) { 58988bec7fa6SStefano Zampini PetscPrintf(PETSC_COMM_SELF,"[%d] sub %d, edge %d, n %d\n",PetscGlobalRank,i,(PetscBool)PetscBTLookup(sub_schurs->is_edge,i),pcbddc->adaptive_constraints_n[i+n_vertices]); 58991b968477SStefano Zampini } 590008122e43SStefano Zampini #endif 590108122e43SStefano Zampini 59028bec7fa6SStefano Zampini max_size_of_constraint = 0; 59039162d606SStefano Zampini for (i=0;i<total_counts_cc;i++) max_size_of_constraint = PetscMax(max_size_of_constraint,constraints_idxs_ptr[i+1]-constraints_idxs_ptr[i]); 59049162d606SStefano Zampini ierr = PetscMalloc1(constraints_idxs_ptr[total_counts_cc],&constraints_idxs_B);CHKERRQ(ierr); 590508122e43SStefano Zampini /* Change of basis */ 5906b3d85658SStefano Zampini ierr = PetscBTCreate(total_counts_cc,&change_basis);CHKERRQ(ierr); 590708122e43SStefano Zampini if (pcbddc->use_change_of_basis) { 590808122e43SStefano Zampini for (i=0;i<sub_schurs->n_subs;i++) { 590908122e43SStefano Zampini if (PetscBTLookup(sub_schurs->is_edge,i) || pcbddc->use_change_on_faces) { 5910b3d85658SStefano Zampini ierr = PetscBTSet(change_basis,i+n_vertices);CHKERRQ(ierr); 591108122e43SStefano Zampini } 591208122e43SStefano Zampini } 591308122e43SStefano Zampini } 591408122e43SStefano Zampini } 5915984c4197SStefano Zampini pcbddc->local_primal_size = total_counts; 
59164f1b2e48SStefano Zampini ierr = PetscMalloc1(pcbddc->local_primal_size+pcbddc->benign_n,&pcbddc->primal_indices_local_idxs);CHKERRQ(ierr); 591708122e43SStefano Zampini 59189162d606SStefano Zampini /* map constraints_idxs in boundary numbering */ 59199162d606SStefano Zampini ierr = ISGlobalToLocalMappingApply(pcis->BtoNmap,IS_GTOLM_DROP,constraints_idxs_ptr[total_counts_cc],constraints_idxs,&i,constraints_idxs_B);CHKERRQ(ierr); 5920eee23b56SStefano Zampini if (i != constraints_idxs_ptr[total_counts_cc]) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Error in boundary numbering for constraints indices %D != %D\n",constraints_idxs_ptr[total_counts_cc],i); 5921674ae819SStefano Zampini 5922674ae819SStefano Zampini /* Create constraint matrix */ 5923674ae819SStefano Zampini ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->ConstraintMatrix);CHKERRQ(ierr); 592416f15bc4SStefano Zampini ierr = MatSetType(pcbddc->ConstraintMatrix,MATAIJ);CHKERRQ(ierr); 5925984c4197SStefano Zampini ierr = MatSetSizes(pcbddc->ConstraintMatrix,pcbddc->local_primal_size,pcis->n,pcbddc->local_primal_size,pcis->n);CHKERRQ(ierr); 5926984c4197SStefano Zampini 5927984c4197SStefano Zampini /* find primal_dofs: subdomain corners plus dofs selected as primal after change of basis */ 5928a717540cSStefano Zampini /* determine if a QR strategy is needed for change of basis */ 5929a717540cSStefano Zampini qr_needed = PETSC_FALSE; 593074d5cdf7SStefano Zampini ierr = PetscBTCreate(total_counts_cc,&qr_needed_idx);CHKERRQ(ierr); 5931984c4197SStefano Zampini total_primal_vertices=0; 5932b3d85658SStefano Zampini pcbddc->local_primal_size_cc = 0; 59339162d606SStefano Zampini for (i=0;i<total_counts_cc;i++) { 59349162d606SStefano Zampini size_of_constraint = constraints_idxs_ptr[i+1]-constraints_idxs_ptr[i]; 593572b8c272SStefano Zampini if (size_of_constraint == 1 && pcbddc->mat_graph->custom_minimal_size) { 59369162d606SStefano Zampini pcbddc->primal_indices_local_idxs[total_primal_vertices++] = 
constraints_idxs[constraints_idxs_ptr[i]]; 5937b3d85658SStefano Zampini pcbddc->local_primal_size_cc += 1; 593864efe560SStefano Zampini } else if (PetscBTLookup(change_basis,i)) { 59399162d606SStefano Zampini for (k=0;k<constraints_n[i];k++) { 59409162d606SStefano Zampini pcbddc->primal_indices_local_idxs[total_primal_vertices++] = constraints_idxs[constraints_idxs_ptr[i]+k]; 5941a717540cSStefano Zampini } 5942b3d85658SStefano Zampini pcbddc->local_primal_size_cc += constraints_n[i]; 594391af6908SStefano Zampini if (constraints_n[i] > 1 || pcbddc->use_qr_single) { 5944a717540cSStefano Zampini PetscBTSet(qr_needed_idx,i); 5945a717540cSStefano Zampini qr_needed = PETSC_TRUE; 5946a717540cSStefano Zampini } 5947fa434743SStefano Zampini } else { 5948b3d85658SStefano Zampini pcbddc->local_primal_size_cc += 1; 5949fa434743SStefano Zampini } 5950a717540cSStefano Zampini } 5951b371cd4fSStefano Zampini /* note that the local variable n_vertices used below stores the number of pointwise constraints */ 5952b371cd4fSStefano Zampini pcbddc->n_vertices = total_primal_vertices; 5953674ae819SStefano Zampini /* permute indices in order to have a sorted set of vertices */ 595470022509SStefano Zampini ierr = PetscSortInt(total_primal_vertices,pcbddc->primal_indices_local_idxs);CHKERRQ(ierr); 59554f1b2e48SStefano Zampini ierr = PetscMalloc2(pcbddc->local_primal_size_cc+pcbddc->benign_n,&pcbddc->local_primal_ref_node,pcbddc->local_primal_size_cc+pcbddc->benign_n,&pcbddc->local_primal_ref_mult);CHKERRQ(ierr); 59560e6343abSStefano Zampini ierr = PetscMemcpy(pcbddc->local_primal_ref_node,pcbddc->primal_indices_local_idxs,total_primal_vertices*sizeof(PetscInt));CHKERRQ(ierr); 59570e6343abSStefano Zampini for (i=0;i<total_primal_vertices;i++) pcbddc->local_primal_ref_mult[i] = 1; 5958984c4197SStefano Zampini 5959984c4197SStefano Zampini /* nonzero structure of constraint matrix */ 596074d5cdf7SStefano Zampini /* and get reference dof for local constraints */ 5961785e854fSJed Brown ierr = 
PetscMalloc1(pcbddc->local_primal_size,&nnz);CHKERRQ(ierr); 5962984c4197SStefano Zampini for (i=0;i<total_primal_vertices;i++) nnz[i] = 1; 596374d5cdf7SStefano Zampini 5964984c4197SStefano Zampini j = total_primal_vertices; 596574d5cdf7SStefano Zampini total_counts = total_primal_vertices; 5966b3d85658SStefano Zampini cum = total_primal_vertices; 59679162d606SStefano Zampini for (i=n_vertices;i<total_counts_cc;i++) { 59684641a718SStefano Zampini if (!PetscBTLookup(change_basis,i)) { 5969b3d85658SStefano Zampini pcbddc->local_primal_ref_node[cum] = constraints_idxs[constraints_idxs_ptr[i]]; 5970b3d85658SStefano Zampini pcbddc->local_primal_ref_mult[cum] = constraints_n[i]; 5971b3d85658SStefano Zampini cum++; 59729162d606SStefano Zampini size_of_constraint = constraints_idxs_ptr[i+1]-constraints_idxs_ptr[i]; 597374d5cdf7SStefano Zampini for (k=0;k<constraints_n[i];k++) { 597474d5cdf7SStefano Zampini pcbddc->primal_indices_local_idxs[total_counts++] = constraints_idxs[constraints_idxs_ptr[i]+k]; 597574d5cdf7SStefano Zampini nnz[j+k] = size_of_constraint; 597674d5cdf7SStefano Zampini } 59779162d606SStefano Zampini j += constraints_n[i]; 5978674ae819SStefano Zampini } 5979674ae819SStefano Zampini } 5980674ae819SStefano Zampini ierr = MatSeqAIJSetPreallocation(pcbddc->ConstraintMatrix,0,nnz);CHKERRQ(ierr); 5981674ae819SStefano Zampini ierr = PetscFree(nnz);CHKERRQ(ierr); 5982088faed8SStefano Zampini 5983674ae819SStefano Zampini /* set values in constraint matrix */ 5984984c4197SStefano Zampini for (i=0;i<total_primal_vertices;i++) { 59850e6343abSStefano Zampini ierr = MatSetValue(pcbddc->ConstraintMatrix,i,pcbddc->local_primal_ref_node[i],1.0,INSERT_VALUES);CHKERRQ(ierr); 5986674ae819SStefano Zampini } 5987984c4197SStefano Zampini total_counts = total_primal_vertices; 59889162d606SStefano Zampini for (i=n_vertices;i<total_counts_cc;i++) { 59894641a718SStefano Zampini if (!PetscBTLookup(change_basis,i)) { 59909162d606SStefano Zampini PetscInt *cols; 59919162d606SStefano 
Zampini 59929162d606SStefano Zampini size_of_constraint = constraints_idxs_ptr[i+1]-constraints_idxs_ptr[i]; 59939162d606SStefano Zampini cols = constraints_idxs+constraints_idxs_ptr[i]; 59949162d606SStefano Zampini for (k=0;k<constraints_n[i];k++) { 59959162d606SStefano Zampini PetscInt row = total_counts+k; 59969162d606SStefano Zampini PetscScalar *vals; 59979162d606SStefano Zampini 59989162d606SStefano Zampini vals = constraints_data+constraints_data_ptr[i]+k*size_of_constraint; 59999162d606SStefano Zampini ierr = MatSetValues(pcbddc->ConstraintMatrix,1,&row,size_of_constraint,cols,vals,INSERT_VALUES);CHKERRQ(ierr); 60009162d606SStefano Zampini } 60019162d606SStefano Zampini total_counts += constraints_n[i]; 6002674ae819SStefano Zampini } 6003674ae819SStefano Zampini } 6004674ae819SStefano Zampini /* assembling */ 6005674ae819SStefano Zampini ierr = MatAssemblyBegin(pcbddc->ConstraintMatrix,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 6006674ae819SStefano Zampini ierr = MatAssemblyEnd(pcbddc->ConstraintMatrix,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 6007088faed8SStefano Zampini 6008984c4197SStefano Zampini /* 60096a9046bcSBarry Smith ierr = PetscViewerPushFormat(PETSC_VIEWER_STDOUT_SELF,PETSC_VIEWER_ASCII_MATLAB);CHKERRQ(ierr); 6010984c4197SStefano Zampini ierr = MatView(pcbddc->ConstraintMatrix,(PetscViewer)0);CHKERRQ(ierr); 6011f159cad9SBarry Smith ierr = PetscViewerPopFormat(PETSC_VIEWER_STDOUT_SELF);CHKERRQ(ierr); 6012984c4197SStefano Zampini */ 6013674ae819SStefano Zampini /* Create matrix for change of basis. 
We don't need it in case pcbddc->use_change_of_basis is FALSE */ 6014674ae819SStefano Zampini if (pcbddc->use_change_of_basis) { 6015026de310SStefano Zampini /* dual and primal dofs on a single cc */ 6016984c4197SStefano Zampini PetscInt dual_dofs,primal_dofs; 6017984c4197SStefano Zampini /* working stuff for GEQRF */ 601881d9aea3SBarry Smith PetscScalar *qr_basis,*qr_tau = NULL,*qr_work,lqr_work_t; 6019984c4197SStefano Zampini PetscBLASInt lqr_work; 6020984c4197SStefano Zampini /* working stuff for UNGQR */ 6021984c4197SStefano Zampini PetscScalar *gqr_work,lgqr_work_t; 6022984c4197SStefano Zampini PetscBLASInt lgqr_work; 6023984c4197SStefano Zampini /* working stuff for TRTRS */ 6024984c4197SStefano Zampini PetscScalar *trs_rhs; 60253f08241aSStefano Zampini PetscBLASInt Blas_NRHS; 6026984c4197SStefano Zampini /* pointers for values insertion into change of basis matrix */ 6027984c4197SStefano Zampini PetscInt *start_rows,*start_cols; 6028984c4197SStefano Zampini PetscScalar *start_vals; 6029984c4197SStefano Zampini /* working stuff for values insertion */ 60304641a718SStefano Zampini PetscBT is_primal; 603164efe560SStefano Zampini PetscInt *aux_primal_numbering_B; 6032906d46d4SStefano Zampini /* matrix sizes */ 6033906d46d4SStefano Zampini PetscInt global_size,local_size; 6034906d46d4SStefano Zampini /* temporary change of basis */ 6035906d46d4SStefano Zampini Mat localChangeOfBasisMatrix; 6036cf5a6209SStefano Zampini /* extra space for debugging */ 6037cf5a6209SStefano Zampini PetscScalar *dbg_work; 6038984c4197SStefano Zampini 6039906d46d4SStefano Zampini /* local temporary change of basis acts on local interfaces -> dimension is n_B x n_B */ 6040906d46d4SStefano Zampini ierr = MatCreate(PETSC_COMM_SELF,&localChangeOfBasisMatrix);CHKERRQ(ierr); 604116f15bc4SStefano Zampini ierr = MatSetType(localChangeOfBasisMatrix,MATAIJ);CHKERRQ(ierr); 6042bbb9e6c6SStefano Zampini ierr = MatSetSizes(localChangeOfBasisMatrix,pcis->n,pcis->n,pcis->n,pcis->n);CHKERRQ(ierr); 
6043906d46d4SStefano Zampini /* nonzeros for local mat */ 6044bbb9e6c6SStefano Zampini ierr = PetscMalloc1(pcis->n,&nnz);CHKERRQ(ierr); 60451dd7afcfSStefano Zampini if (!pcbddc->benign_change || pcbddc->fake_change) { 6046bbb9e6c6SStefano Zampini for (i=0;i<pcis->n;i++) nnz[i]=1; 60471dd7afcfSStefano Zampini } else { 60481dd7afcfSStefano Zampini const PetscInt *ii; 60491dd7afcfSStefano Zampini PetscInt n; 60501dd7afcfSStefano Zampini PetscBool flg_row; 60511dd7afcfSStefano Zampini ierr = MatGetRowIJ(pcbddc->benign_change,0,PETSC_FALSE,PETSC_FALSE,&n,&ii,NULL,&flg_row);CHKERRQ(ierr); 60521dd7afcfSStefano Zampini for (i=0;i<n;i++) nnz[i] = ii[i+1]-ii[i]; 60531dd7afcfSStefano Zampini ierr = MatRestoreRowIJ(pcbddc->benign_change,0,PETSC_FALSE,PETSC_FALSE,&n,&ii,NULL,&flg_row);CHKERRQ(ierr); 60541dd7afcfSStefano Zampini } 60559162d606SStefano Zampini for (i=n_vertices;i<total_counts_cc;i++) { 6056a717540cSStefano Zampini if (PetscBTLookup(change_basis,i)) { 60579162d606SStefano Zampini size_of_constraint = constraints_idxs_ptr[i+1]-constraints_idxs_ptr[i]; 6058a717540cSStefano Zampini if (PetscBTLookup(qr_needed_idx,i)) { 60599162d606SStefano Zampini for (j=0;j<size_of_constraint;j++) nnz[constraints_idxs[constraints_idxs_ptr[i]+j]] = size_of_constraint; 6060a717540cSStefano Zampini } else { 60619162d606SStefano Zampini nnz[constraints_idxs[constraints_idxs_ptr[i]]] = size_of_constraint; 60629162d606SStefano Zampini for (j=1;j<size_of_constraint;j++) nnz[constraints_idxs[constraints_idxs_ptr[i]+j]] = 2; 6063a717540cSStefano Zampini } 6064a717540cSStefano Zampini } 6065a717540cSStefano Zampini } 6066906d46d4SStefano Zampini ierr = MatSeqAIJSetPreallocation(localChangeOfBasisMatrix,0,nnz);CHKERRQ(ierr); 6067bbb9e6c6SStefano Zampini ierr = PetscFree(nnz);CHKERRQ(ierr); 60681dd7afcfSStefano Zampini /* Set interior change in the matrix */ 60691dd7afcfSStefano Zampini if (!pcbddc->benign_change || pcbddc->fake_change) { 6070bbb9e6c6SStefano Zampini for (i=0;i<pcis->n;i++) { 
6071906d46d4SStefano Zampini ierr = MatSetValue(localChangeOfBasisMatrix,i,i,1.0,INSERT_VALUES);CHKERRQ(ierr); 6072a717540cSStefano Zampini } 60731dd7afcfSStefano Zampini } else { 60741dd7afcfSStefano Zampini const PetscInt *ii,*jj; 60751dd7afcfSStefano Zampini PetscScalar *aa; 60761dd7afcfSStefano Zampini PetscInt n; 60771dd7afcfSStefano Zampini PetscBool flg_row; 60781dd7afcfSStefano Zampini ierr = MatGetRowIJ(pcbddc->benign_change,0,PETSC_FALSE,PETSC_FALSE,&n,&ii,&jj,&flg_row);CHKERRQ(ierr); 60791dd7afcfSStefano Zampini ierr = MatSeqAIJGetArray(pcbddc->benign_change,&aa);CHKERRQ(ierr); 60801dd7afcfSStefano Zampini for (i=0;i<n;i++) { 60811dd7afcfSStefano Zampini ierr = MatSetValues(localChangeOfBasisMatrix,1,&i,ii[i+1]-ii[i],jj+ii[i],aa+ii[i],INSERT_VALUES);CHKERRQ(ierr); 60821dd7afcfSStefano Zampini } 60831dd7afcfSStefano Zampini ierr = MatSeqAIJRestoreArray(pcbddc->benign_change,&aa);CHKERRQ(ierr); 60841dd7afcfSStefano Zampini ierr = MatRestoreRowIJ(pcbddc->benign_change,0,PETSC_FALSE,PETSC_FALSE,&n,&ii,&jj,&flg_row);CHKERRQ(ierr); 60851dd7afcfSStefano Zampini } 6086a717540cSStefano Zampini 6087a717540cSStefano Zampini if (pcbddc->dbg_flag) { 6088a717540cSStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"--------------------------------------------------------------\n");CHKERRQ(ierr); 6089a717540cSStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"Checking change of basis computation for subdomain %04d\n",PetscGlobalRank);CHKERRQ(ierr); 6090a717540cSStefano Zampini } 6091a717540cSStefano Zampini 6092a717540cSStefano Zampini 6093a717540cSStefano Zampini /* Now we loop on the constraints which need a change of basis */ 6094a717540cSStefano Zampini /* 6095a717540cSStefano Zampini Change of basis matrix is evaluated similarly to the FIRST APPROACH in 6096a717540cSStefano Zampini Klawonn and Widlund, Dual-primal FETI-DP methods for linear elasticity, (see Sect 6.2.1) 6097a717540cSStefano Zampini 
6098a6b551f4SStefano Zampini Basic blocks of change of basis matrix T computed by 6099a717540cSStefano Zampini 6100a6b551f4SStefano Zampini - Using the following block transformation if there is only a primal dof on the cc (and -pc_bddc_use_qr_single is not specified) 6101a6b551f4SStefano Zampini 6102a6b551f4SStefano Zampini | 1 0 ... 0 s_1/S | 6103a6b551f4SStefano Zampini | 0 1 ... 0 s_2/S | 6104a717540cSStefano Zampini | ... | 6105a6b551f4SStefano Zampini | 0 ... 1 s_{n-1}/S | 6106a6b551f4SStefano Zampini | -s_1/s_n ... -s_{n-1}/s_n s_n/S | 6107a717540cSStefano Zampini 6108a6b551f4SStefano Zampini with S = \sum_{i=1}^n s_i^2 6109a6b551f4SStefano Zampini NOTE: in the above example, the primal dof is the last one of the edge in LOCAL ordering 6110a6b551f4SStefano Zampini in the current implementation, the primal dof is the first one of the edge in GLOBAL ordering 6111a6b551f4SStefano Zampini 6112a6b551f4SStefano Zampini - QR decomposition of constraints otherwise 6113a717540cSStefano Zampini */ 6114a717540cSStefano Zampini if (qr_needed) { 6115984c4197SStefano Zampini /* space to store Q */ 6116854ce69bSBarry Smith ierr = PetscMalloc1(max_size_of_constraint*max_size_of_constraint,&qr_basis);CHKERRQ(ierr); 61174e64d54eSstefano_zampini /* array to store scaling factors for reflectors */ 61184e64d54eSstefano_zampini ierr = PetscMalloc1(max_constraints,&qr_tau);CHKERRQ(ierr); 6119984c4197SStefano Zampini /* first we issue queries for optimal work */ 61203f08241aSStefano Zampini ierr = PetscBLASIntCast(max_size_of_constraint,&Blas_M);CHKERRQ(ierr); 61213f08241aSStefano Zampini ierr = PetscBLASIntCast(max_constraints,&Blas_N);CHKERRQ(ierr); 61223f08241aSStefano Zampini ierr = PetscBLASIntCast(max_size_of_constraint,&Blas_LDA);CHKERRQ(ierr); 6123984c4197SStefano Zampini lqr_work = -1; 61243f08241aSStefano Zampini PetscStackCallBLAS("LAPACKgeqrf",LAPACKgeqrf_(&Blas_M,&Blas_N,qr_basis,&Blas_LDA,qr_tau,&lqr_work_t,&lqr_work,&lierr)); 6125984c4197SStefano Zampini if (lierr) 
SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in query to GEQRF Lapack routine %d",(int)lierr); 6126984c4197SStefano Zampini ierr = PetscBLASIntCast((PetscInt)PetscRealPart(lqr_work_t),&lqr_work);CHKERRQ(ierr); 6127785e854fSJed Brown ierr = PetscMalloc1((PetscInt)PetscRealPart(lqr_work_t),&qr_work);CHKERRQ(ierr); 6128984c4197SStefano Zampini lgqr_work = -1; 61293f08241aSStefano Zampini ierr = PetscBLASIntCast(max_size_of_constraint,&Blas_M);CHKERRQ(ierr); 61303f08241aSStefano Zampini ierr = PetscBLASIntCast(max_size_of_constraint,&Blas_N);CHKERRQ(ierr); 61313f08241aSStefano Zampini ierr = PetscBLASIntCast(max_constraints,&Blas_K);CHKERRQ(ierr); 61323f08241aSStefano Zampini ierr = PetscBLASIntCast(max_size_of_constraint,&Blas_LDA);CHKERRQ(ierr); 61333f08241aSStefano Zampini if (Blas_K>Blas_M) Blas_K=Blas_M; /* adjust just for computing optimal work */ 6134*c964aadfSJose E. Roman PetscStackCallBLAS("LAPACKorgqr",LAPACKorgqr_(&Blas_M,&Blas_N,&Blas_K,qr_basis,&Blas_LDA,qr_tau,&lgqr_work_t,&lgqr_work,&lierr)); 6135*c964aadfSJose E. 
Roman if (lierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in query to ORGQR/UNGQR Lapack routine %d",(int)lierr); 6136984c4197SStefano Zampini ierr = PetscBLASIntCast((PetscInt)PetscRealPart(lgqr_work_t),&lgqr_work);CHKERRQ(ierr); 6137785e854fSJed Brown ierr = PetscMalloc1((PetscInt)PetscRealPart(lgqr_work_t),&gqr_work);CHKERRQ(ierr); 6138984c4197SStefano Zampini /* array to store rhs and solution of triangular solver */ 6139785e854fSJed Brown ierr = PetscMalloc1(max_constraints*max_constraints,&trs_rhs);CHKERRQ(ierr); 6140a717540cSStefano Zampini /* allocating workspace for check */ 6141a717540cSStefano Zampini if (pcbddc->dbg_flag) { 6142cf5a6209SStefano Zampini ierr = PetscMalloc1(max_size_of_constraint*(max_constraints+max_size_of_constraint),&dbg_work);CHKERRQ(ierr); 6143a717540cSStefano Zampini } 6144a717540cSStefano Zampini } 6145984c4197SStefano Zampini /* array to store whether a node is primal or not */ 61464641a718SStefano Zampini ierr = PetscBTCreate(pcis->n_B,&is_primal);CHKERRQ(ierr); 6147473ba861SJed Brown ierr = PetscMalloc1(total_primal_vertices,&aux_primal_numbering_B);CHKERRQ(ierr); 61480e6343abSStefano Zampini ierr = ISGlobalToLocalMappingApply(pcis->BtoNmap,IS_GTOLM_DROP,total_primal_vertices,pcbddc->local_primal_ref_node,&i,aux_primal_numbering_B);CHKERRQ(ierr); 6149eee23b56SStefano Zampini if (i != total_primal_vertices) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Error in boundary numbering for BDDC vertices! 
%D != %D\n",total_primal_vertices,i); 615039e2fb2aSStefano Zampini for (i=0;i<total_primal_vertices;i++) { 615139e2fb2aSStefano Zampini ierr = PetscBTSet(is_primal,aux_primal_numbering_B[i]);CHKERRQ(ierr); 615239e2fb2aSStefano Zampini } 615339e2fb2aSStefano Zampini ierr = PetscFree(aux_primal_numbering_B);CHKERRQ(ierr); 6154984c4197SStefano Zampini 6155a717540cSStefano Zampini /* loop on constraints and see whether or not they need a change of basis and compute it */ 61569162d606SStefano Zampini for (total_counts=n_vertices;total_counts<total_counts_cc;total_counts++) { 61579162d606SStefano Zampini size_of_constraint = constraints_idxs_ptr[total_counts+1]-constraints_idxs_ptr[total_counts]; 61584641a718SStefano Zampini if (PetscBTLookup(change_basis,total_counts)) { 6159984c4197SStefano Zampini /* get constraint info */ 61609162d606SStefano Zampini primal_dofs = constraints_n[total_counts]; 6161984c4197SStefano Zampini dual_dofs = size_of_constraint-primal_dofs; 6162984c4197SStefano Zampini 6163984c4197SStefano Zampini if (pcbddc->dbg_flag) { 61649162d606SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"Constraints %d: %d need a change of basis (size %d)\n",total_counts,primal_dofs,size_of_constraint);CHKERRQ(ierr); 6165674ae819SStefano Zampini } 6166984c4197SStefano Zampini 6167fa434743SStefano Zampini if (PetscBTLookup(qr_needed_idx,total_counts)) { /* QR */ 6168a717540cSStefano Zampini 6169a717540cSStefano Zampini /* copy quadrature constraints for change of basis check */ 6170a717540cSStefano Zampini if (pcbddc->dbg_flag) { 61719162d606SStefano Zampini ierr = PetscMemcpy(dbg_work,&constraints_data[constraints_data_ptr[total_counts]],size_of_constraint*primal_dofs*sizeof(PetscScalar));CHKERRQ(ierr); 6172a717540cSStefano Zampini } 6173984c4197SStefano Zampini /* copy temporary constraints into larger work vector (in order to store all columns of Q) */ 61749162d606SStefano Zampini ierr = 
PetscMemcpy(qr_basis,&constraints_data[constraints_data_ptr[total_counts]],size_of_constraint*primal_dofs*sizeof(PetscScalar));CHKERRQ(ierr); 6175984c4197SStefano Zampini 6176984c4197SStefano Zampini /* compute QR decomposition of constraints */ 61773f08241aSStefano Zampini ierr = PetscBLASIntCast(size_of_constraint,&Blas_M);CHKERRQ(ierr); 61783f08241aSStefano Zampini ierr = PetscBLASIntCast(primal_dofs,&Blas_N);CHKERRQ(ierr); 61793f08241aSStefano Zampini ierr = PetscBLASIntCast(size_of_constraint,&Blas_LDA);CHKERRQ(ierr); 6180674ae819SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 61813f08241aSStefano Zampini PetscStackCallBLAS("LAPACKgeqrf",LAPACKgeqrf_(&Blas_M,&Blas_N,qr_basis,&Blas_LDA,qr_tau,qr_work,&lqr_work,&lierr)); 6182984c4197SStefano Zampini if (lierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in GEQRF Lapack routine %d",(int)lierr); 6183674ae819SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 6184984c4197SStefano Zampini 6185984c4197SStefano Zampini /* explictly compute R^-T */ 6186984c4197SStefano Zampini ierr = PetscMemzero(trs_rhs,primal_dofs*primal_dofs*sizeof(*trs_rhs));CHKERRQ(ierr); 6187984c4197SStefano Zampini for (j=0;j<primal_dofs;j++) trs_rhs[j*(primal_dofs+1)] = 1.0; 61883f08241aSStefano Zampini ierr = PetscBLASIntCast(primal_dofs,&Blas_N);CHKERRQ(ierr); 61893f08241aSStefano Zampini ierr = PetscBLASIntCast(primal_dofs,&Blas_NRHS);CHKERRQ(ierr); 61903f08241aSStefano Zampini ierr = PetscBLASIntCast(size_of_constraint,&Blas_LDA);CHKERRQ(ierr); 61913f08241aSStefano Zampini ierr = PetscBLASIntCast(primal_dofs,&Blas_LDB);CHKERRQ(ierr); 6192984c4197SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 61933f08241aSStefano Zampini PetscStackCallBLAS("LAPACKtrtrs",LAPACKtrtrs_("U","T","N",&Blas_N,&Blas_NRHS,qr_basis,&Blas_LDA,trs_rhs,&Blas_LDB,&lierr)); 6194984c4197SStefano Zampini if (lierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in TRTRS Lapack routine %d",(int)lierr); 
6195984c4197SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 6196984c4197SStefano Zampini 6197a717540cSStefano Zampini /* explicitly compute all columns of Q (Q = [Q1 | Q2] ) overwriting QR factorization in qr_basis */ 61983f08241aSStefano Zampini ierr = PetscBLASIntCast(size_of_constraint,&Blas_M);CHKERRQ(ierr); 61993f08241aSStefano Zampini ierr = PetscBLASIntCast(size_of_constraint,&Blas_N);CHKERRQ(ierr); 62003f08241aSStefano Zampini ierr = PetscBLASIntCast(primal_dofs,&Blas_K);CHKERRQ(ierr); 62013f08241aSStefano Zampini ierr = PetscBLASIntCast(size_of_constraint,&Blas_LDA);CHKERRQ(ierr); 6202984c4197SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 6203*c964aadfSJose E. Roman PetscStackCallBLAS("LAPACKorgqr",LAPACKorgqr_(&Blas_M,&Blas_N,&Blas_K,qr_basis,&Blas_LDA,qr_tau,gqr_work,&lgqr_work,&lierr)); 6204*c964aadfSJose E. Roman if (lierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in ORGQR/UNGQR Lapack routine %d",(int)lierr); 6205984c4197SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 6206984c4197SStefano Zampini 6207984c4197SStefano Zampini /* first primal_dofs columns of Q need to be re-scaled in order to be unitary w.r.t constraints 6208984c4197SStefano Zampini i.e. C_{pxn}*Q_{nxn} should be equal to [I_pxp | 0_pxd] (see check below) 6209984c4197SStefano Zampini where n=size_of_constraint, p=primal_dofs, d=dual_dofs (n=p+d), I and 0 identity and null matrix resp. 
*/ 62103f08241aSStefano Zampini ierr = PetscBLASIntCast(size_of_constraint,&Blas_M);CHKERRQ(ierr); 62113f08241aSStefano Zampini ierr = PetscBLASIntCast(primal_dofs,&Blas_N);CHKERRQ(ierr); 62123f08241aSStefano Zampini ierr = PetscBLASIntCast(primal_dofs,&Blas_K);CHKERRQ(ierr); 62133f08241aSStefano Zampini ierr = PetscBLASIntCast(size_of_constraint,&Blas_LDA);CHKERRQ(ierr); 62143f08241aSStefano Zampini ierr = PetscBLASIntCast(primal_dofs,&Blas_LDB);CHKERRQ(ierr); 62153f08241aSStefano Zampini ierr = PetscBLASIntCast(size_of_constraint,&Blas_LDC);CHKERRQ(ierr); 6216984c4197SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 62179162d606SStefano Zampini PetscStackCallBLAS("BLASgemm",BLASgemm_("N","N",&Blas_M,&Blas_N,&Blas_K,&one,qr_basis,&Blas_LDA,trs_rhs,&Blas_LDB,&zero,constraints_data+constraints_data_ptr[total_counts],&Blas_LDC)); 6218984c4197SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 62199162d606SStefano Zampini ierr = PetscMemcpy(qr_basis,&constraints_data[constraints_data_ptr[total_counts]],size_of_constraint*primal_dofs*sizeof(PetscScalar));CHKERRQ(ierr); 6220984c4197SStefano Zampini 6221984c4197SStefano Zampini /* insert values in change of basis matrix respecting global ordering of new primal dofs */ 62229162d606SStefano Zampini start_rows = &constraints_idxs[constraints_idxs_ptr[total_counts]]; 6223984c4197SStefano Zampini /* insert cols for primal dofs */ 6224984c4197SStefano Zampini for (j=0;j<primal_dofs;j++) { 6225984c4197SStefano Zampini start_vals = &qr_basis[j*size_of_constraint]; 62269162d606SStefano Zampini start_cols = &constraints_idxs[constraints_idxs_ptr[total_counts]+j]; 6227906d46d4SStefano Zampini ierr = MatSetValues(localChangeOfBasisMatrix,size_of_constraint,start_rows,1,start_cols,start_vals,INSERT_VALUES);CHKERRQ(ierr); 6228984c4197SStefano Zampini } 6229984c4197SStefano Zampini /* insert cols for dual dofs */ 6230984c4197SStefano Zampini for (j=0,k=0;j<dual_dofs;k++) { 62319162d606SStefano Zampini if 
(!PetscBTLookup(is_primal,constraints_idxs_B[constraints_idxs_ptr[total_counts]+k])) { 6232984c4197SStefano Zampini start_vals = &qr_basis[(primal_dofs+j)*size_of_constraint]; 62339162d606SStefano Zampini start_cols = &constraints_idxs[constraints_idxs_ptr[total_counts]+k]; 6234906d46d4SStefano Zampini ierr = MatSetValues(localChangeOfBasisMatrix,size_of_constraint,start_rows,1,start_cols,start_vals,INSERT_VALUES);CHKERRQ(ierr); 6235984c4197SStefano Zampini j++; 6236674ae819SStefano Zampini } 6237674ae819SStefano Zampini } 6238984c4197SStefano Zampini 6239984c4197SStefano Zampini /* check change of basis */ 6240984c4197SStefano Zampini if (pcbddc->dbg_flag) { 6241984c4197SStefano Zampini PetscInt ii,jj; 6242984c4197SStefano Zampini PetscBool valid_qr=PETSC_TRUE; 6243c4303822SStefano Zampini ierr = PetscBLASIntCast(primal_dofs,&Blas_M);CHKERRQ(ierr); 6244c4303822SStefano Zampini ierr = PetscBLASIntCast(size_of_constraint,&Blas_N);CHKERRQ(ierr); 6245c4303822SStefano Zampini ierr = PetscBLASIntCast(size_of_constraint,&Blas_K);CHKERRQ(ierr); 6246c4303822SStefano Zampini ierr = PetscBLASIntCast(size_of_constraint,&Blas_LDA);CHKERRQ(ierr); 6247c4303822SStefano Zampini ierr = PetscBLASIntCast(size_of_constraint,&Blas_LDB);CHKERRQ(ierr); 6248c4303822SStefano Zampini ierr = PetscBLASIntCast(primal_dofs,&Blas_LDC);CHKERRQ(ierr); 6249984c4197SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 6250cf5a6209SStefano Zampini PetscStackCallBLAS("BLASgemm",BLASgemm_("T","N",&Blas_M,&Blas_N,&Blas_K,&one,dbg_work,&Blas_LDA,qr_basis,&Blas_LDB,&zero,&dbg_work[size_of_constraint*primal_dofs],&Blas_LDC)); 6251984c4197SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 6252984c4197SStefano Zampini for (jj=0;jj<size_of_constraint;jj++) { 6253984c4197SStefano Zampini for (ii=0;ii<primal_dofs;ii++) { 6254cf5a6209SStefano Zampini if (ii != jj && PetscAbsScalar(dbg_work[size_of_constraint*primal_dofs+jj*primal_dofs+ii]) > 1.e-12) valid_qr = PETSC_FALSE; 
6255cf5a6209SStefano Zampini if (ii == jj && PetscAbsScalar(dbg_work[size_of_constraint*primal_dofs+jj*primal_dofs+ii]-1.0) > 1.e-12) valid_qr = PETSC_FALSE; 6256674ae819SStefano Zampini } 6257674ae819SStefano Zampini } 6258984c4197SStefano Zampini if (!valid_qr) { 625922d5777bSStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"\t-> wrong change of basis!\n");CHKERRQ(ierr); 6260984c4197SStefano Zampini for (jj=0;jj<size_of_constraint;jj++) { 6261984c4197SStefano Zampini for (ii=0;ii<primal_dofs;ii++) { 6262cf5a6209SStefano Zampini if (ii != jj && PetscAbsScalar(dbg_work[size_of_constraint*primal_dofs+jj*primal_dofs+ii]) > 1.e-12) { 6263cf5a6209SStefano Zampini PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"\tQr basis function %d is not orthogonal to constraint %d (%1.14e)!\n",jj,ii,PetscAbsScalar(dbg_work[size_of_constraint*primal_dofs+jj*primal_dofs+ii])); 6264674ae819SStefano Zampini } 6265cf5a6209SStefano Zampini if (ii == jj && PetscAbsScalar(dbg_work[size_of_constraint*primal_dofs+jj*primal_dofs+ii]-1.0) > 1.e-12) { 6266cf5a6209SStefano Zampini PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"\tQr basis function %d is not unitary w.r.t constraint %d (%1.14e)!\n",jj,ii,PetscAbsScalar(dbg_work[size_of_constraint*primal_dofs+jj*primal_dofs+ii])); 6267984c4197SStefano Zampini } 6268984c4197SStefano Zampini } 6269984c4197SStefano Zampini } 6270674ae819SStefano Zampini } else { 627122d5777bSStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"\t-> right change of basis!\n");CHKERRQ(ierr); 6272674ae819SStefano Zampini } 6273674ae819SStefano Zampini } 6274a717540cSStefano Zampini } else { /* simple transformation block */ 6275a717540cSStefano Zampini PetscInt row,col; 6276a6b551f4SStefano Zampini PetscScalar val,norm; 6277a6b551f4SStefano Zampini 6278a6b551f4SStefano Zampini ierr = PetscBLASIntCast(size_of_constraint,&Blas_N);CHKERRQ(ierr); 62799162d606SStefano Zampini PetscStackCallBLAS("BLASdot",norm 
= BLASdot_(&Blas_N,constraints_data+constraints_data_ptr[total_counts],&Blas_one,constraints_data+constraints_data_ptr[total_counts],&Blas_one)); 6280a717540cSStefano Zampini for (j=0;j<size_of_constraint;j++) { 62819162d606SStefano Zampini PetscInt row_B = constraints_idxs_B[constraints_idxs_ptr[total_counts]+j]; 62829162d606SStefano Zampini row = constraints_idxs[constraints_idxs_ptr[total_counts]+j]; 6283bbb9e6c6SStefano Zampini if (!PetscBTLookup(is_primal,row_B)) { 62849162d606SStefano Zampini col = constraints_idxs[constraints_idxs_ptr[total_counts]]; 6285906d46d4SStefano Zampini ierr = MatSetValue(localChangeOfBasisMatrix,row,row,1.0,INSERT_VALUES);CHKERRQ(ierr); 62869162d606SStefano Zampini ierr = MatSetValue(localChangeOfBasisMatrix,row,col,constraints_data[constraints_data_ptr[total_counts]+j]/norm,INSERT_VALUES);CHKERRQ(ierr); 6287a717540cSStefano Zampini } else { 6288a717540cSStefano Zampini for (k=0;k<size_of_constraint;k++) { 62899162d606SStefano Zampini col = constraints_idxs[constraints_idxs_ptr[total_counts]+k]; 6290a717540cSStefano Zampini if (row != col) { 62919162d606SStefano Zampini val = -constraints_data[constraints_data_ptr[total_counts]+k]/constraints_data[constraints_data_ptr[total_counts]]; 6292a717540cSStefano Zampini } else { 62939162d606SStefano Zampini val = constraints_data[constraints_data_ptr[total_counts]]/norm; 6294a717540cSStefano Zampini } 6295906d46d4SStefano Zampini ierr = MatSetValue(localChangeOfBasisMatrix,row,col,val,INSERT_VALUES);CHKERRQ(ierr); 6296a717540cSStefano Zampini } 6297a717540cSStefano Zampini } 6298a717540cSStefano Zampini } 629998a51de6SStefano Zampini if (pcbddc->dbg_flag) { 630022d5777bSStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"\t-> using standard change of basis\n");CHKERRQ(ierr); 6301a717540cSStefano Zampini } 6302674ae819SStefano Zampini } 6303984c4197SStefano Zampini } else { 6304984c4197SStefano Zampini if (pcbddc->dbg_flag) { 63059162d606SStefano Zampini ierr = 
PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"Constraint %d does not need a change of basis (size %d)\n",total_counts,size_of_constraint);CHKERRQ(ierr); 6306674ae819SStefano Zampini } 6307674ae819SStefano Zampini } 6308674ae819SStefano Zampini } 6309a717540cSStefano Zampini 6310a717540cSStefano Zampini /* free workspace */ 6311a717540cSStefano Zampini if (qr_needed) { 6312984c4197SStefano Zampini if (pcbddc->dbg_flag) { 6313cf5a6209SStefano Zampini ierr = PetscFree(dbg_work);CHKERRQ(ierr); 6314984c4197SStefano Zampini } 6315984c4197SStefano Zampini ierr = PetscFree(trs_rhs);CHKERRQ(ierr); 6316984c4197SStefano Zampini ierr = PetscFree(qr_tau);CHKERRQ(ierr); 6317984c4197SStefano Zampini ierr = PetscFree(qr_work);CHKERRQ(ierr); 6318984c4197SStefano Zampini ierr = PetscFree(gqr_work);CHKERRQ(ierr); 6319984c4197SStefano Zampini ierr = PetscFree(qr_basis);CHKERRQ(ierr); 6320674ae819SStefano Zampini } 6321a717540cSStefano Zampini ierr = PetscBTDestroy(&is_primal);CHKERRQ(ierr); 6322906d46d4SStefano Zampini ierr = MatAssemblyBegin(localChangeOfBasisMatrix,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 6323906d46d4SStefano Zampini ierr = MatAssemblyEnd(localChangeOfBasisMatrix,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 6324906d46d4SStefano Zampini 6325906d46d4SStefano Zampini /* assembling of global change of variable */ 632688c03ad3SStefano Zampini if (!pcbddc->fake_change) { 6327bbb9e6c6SStefano Zampini Mat tmat; 632816f15bc4SStefano Zampini PetscInt bs; 632916f15bc4SStefano Zampini 6330906d46d4SStefano Zampini ierr = VecGetSize(pcis->vec1_global,&global_size);CHKERRQ(ierr); 6331906d46d4SStefano Zampini ierr = VecGetLocalSize(pcis->vec1_global,&local_size);CHKERRQ(ierr); 6332bbb9e6c6SStefano Zampini ierr = MatDuplicate(pc->pmat,MAT_DO_NOT_COPY_VALUES,&tmat);CHKERRQ(ierr); 6333bbb9e6c6SStefano Zampini ierr = MatISSetLocalMat(tmat,localChangeOfBasisMatrix);CHKERRQ(ierr); 6334bbb9e6c6SStefano Zampini ierr = 
MatCreate(PetscObjectComm((PetscObject)pc),&pcbddc->ChangeOfBasisMatrix);CHKERRQ(ierr); 6335bbb9e6c6SStefano Zampini ierr = MatSetType(pcbddc->ChangeOfBasisMatrix,MATAIJ);CHKERRQ(ierr); 633616f15bc4SStefano Zampini ierr = MatGetBlockSize(pc->pmat,&bs);CHKERRQ(ierr); 633716f15bc4SStefano Zampini ierr = MatSetBlockSize(pcbddc->ChangeOfBasisMatrix,bs);CHKERRQ(ierr); 6338906d46d4SStefano Zampini ierr = MatSetSizes(pcbddc->ChangeOfBasisMatrix,local_size,local_size,global_size,global_size);CHKERRQ(ierr); 6339bbb9e6c6SStefano Zampini ierr = MatISSetMPIXAIJPreallocation_Private(tmat,pcbddc->ChangeOfBasisMatrix,PETSC_TRUE);CHKERRQ(ierr); 6340bbb9e6c6SStefano Zampini ierr = MatISGetMPIXAIJ(tmat,MAT_REUSE_MATRIX,&pcbddc->ChangeOfBasisMatrix);CHKERRQ(ierr); 6341bbb9e6c6SStefano Zampini ierr = MatDestroy(&tmat);CHKERRQ(ierr); 6342bbb9e6c6SStefano Zampini ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr); 6343bbb9e6c6SStefano Zampini ierr = VecSet(pcis->vec1_N,1.0);CHKERRQ(ierr); 6344e176bc59SStefano Zampini ierr = VecScatterBegin(matis->rctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 6345e176bc59SStefano Zampini ierr = VecScatterEnd(matis->rctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 6346bbb9e6c6SStefano Zampini ierr = VecReciprocal(pcis->vec1_global);CHKERRQ(ierr); 6347bbb9e6c6SStefano Zampini ierr = MatDiagonalScale(pcbddc->ChangeOfBasisMatrix,pcis->vec1_global,NULL);CHKERRQ(ierr); 634888c03ad3SStefano Zampini 6349906d46d4SStefano Zampini /* check */ 6350906d46d4SStefano Zampini if (pcbddc->dbg_flag) { 6351906d46d4SStefano Zampini PetscReal error; 6352906d46d4SStefano Zampini Vec x,x_change; 6353906d46d4SStefano Zampini 6354906d46d4SStefano Zampini ierr = VecDuplicate(pcis->vec1_global,&x);CHKERRQ(ierr); 6355906d46d4SStefano Zampini ierr = VecDuplicate(pcis->vec1_global,&x_change);CHKERRQ(ierr); 6356906d46d4SStefano Zampini ierr = VecSetRandom(x,NULL);CHKERRQ(ierr); 6357906d46d4SStefano Zampini ierr = 
VecCopy(x,pcis->vec1_global);CHKERRQ(ierr); 6358e176bc59SStefano Zampini ierr = VecScatterBegin(matis->rctx,x,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 6359e176bc59SStefano Zampini ierr = VecScatterEnd(matis->rctx,x,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 6360bbb9e6c6SStefano Zampini ierr = MatMult(localChangeOfBasisMatrix,pcis->vec1_N,pcis->vec2_N);CHKERRQ(ierr); 6361e176bc59SStefano Zampini ierr = VecScatterBegin(matis->rctx,pcis->vec2_N,x,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 6362e176bc59SStefano Zampini ierr = VecScatterEnd(matis->rctx,pcis->vec2_N,x,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 6363906d46d4SStefano Zampini ierr = MatMult(pcbddc->ChangeOfBasisMatrix,pcis->vec1_global,x_change);CHKERRQ(ierr); 6364906d46d4SStefano Zampini ierr = VecAXPY(x,-1.0,x_change);CHKERRQ(ierr); 6365906d46d4SStefano Zampini ierr = VecNorm(x,NORM_INFINITY,&error);CHKERRQ(ierr); 6366637e8532SStefano Zampini if (error > PETSC_SMALL) { 6367637e8532SStefano Zampini SETERRQ1(PetscObjectComm((PetscObject)pc),PETSC_ERR_PLIB,"Error global vs local change on N: %1.6e\n",error); 6368637e8532SStefano Zampini } 6369906d46d4SStefano Zampini ierr = VecDestroy(&x);CHKERRQ(ierr); 6370906d46d4SStefano Zampini ierr = VecDestroy(&x_change);CHKERRQ(ierr); 6371906d46d4SStefano Zampini } 6372b96c3477SStefano Zampini /* adapt sub_schurs computed (if any) */ 6373b96c3477SStefano Zampini if (pcbddc->use_deluxe_scaling) { 6374b96c3477SStefano Zampini PCBDDCSubSchurs sub_schurs=pcbddc->sub_schurs; 6375bf3a8328SStefano Zampini 637613903a91SSatish Balay if (pcbddc->use_change_of_basis && pcbddc->adaptive_userdefined) SETERRQ(PetscObjectComm((PetscObject)pc),PETSC_ERR_SUP,"Cannot mix automatic change of basis, adaptive selection and user-defined constraints"); 6377b334f244SStefano Zampini if (sub_schurs && sub_schurs->S_Ej_all) { 6378ac632422SStefano Zampini Mat S_new,tmat; 6379bf3a8328SStefano Zampini IS is_all_N,is_V_Sall = NULL; 6380bbb9e6c6SStefano Zampini 
6381bbb9e6c6SStefano Zampini ierr = ISLocalToGlobalMappingApplyIS(pcis->BtoNmap,sub_schurs->is_Ej_all,&is_all_N);CHKERRQ(ierr); 63827dae84e0SHong Zhang ierr = MatCreateSubMatrix(localChangeOfBasisMatrix,is_all_N,is_all_N,MAT_INITIAL_MATRIX,&tmat);CHKERRQ(ierr); 6383bf3a8328SStefano Zampini if (pcbddc->deluxe_zerorows) { 6384bf3a8328SStefano Zampini ISLocalToGlobalMapping NtoSall; 6385bf3a8328SStefano Zampini IS is_V; 6386b087196eSStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,pcbddc->n_vertices,pcbddc->local_primal_ref_node,PETSC_COPY_VALUES,&is_V);CHKERRQ(ierr); 6387b087196eSStefano Zampini ierr = ISLocalToGlobalMappingCreateIS(is_all_N,&NtoSall);CHKERRQ(ierr); 6388b087196eSStefano Zampini ierr = ISGlobalToLocalMappingApplyIS(NtoSall,IS_GTOLM_DROP,is_V,&is_V_Sall);CHKERRQ(ierr); 6389b087196eSStefano Zampini ierr = ISLocalToGlobalMappingDestroy(&NtoSall);CHKERRQ(ierr); 6390b087196eSStefano Zampini ierr = ISDestroy(&is_V);CHKERRQ(ierr); 6391bf3a8328SStefano Zampini } 6392bf3a8328SStefano Zampini ierr = ISDestroy(&is_all_N);CHKERRQ(ierr); 6393ac632422SStefano Zampini ierr = MatPtAP(sub_schurs->S_Ej_all,tmat,MAT_INITIAL_MATRIX,1.0,&S_new);CHKERRQ(ierr); 6394b96c3477SStefano Zampini ierr = MatDestroy(&sub_schurs->S_Ej_all);CHKERRQ(ierr); 6395ac632422SStefano Zampini ierr = PetscObjectReference((PetscObject)S_new);CHKERRQ(ierr); 6396bf3a8328SStefano Zampini if (pcbddc->deluxe_zerorows) { 6397bf3a8328SStefano Zampini const PetscScalar *array; 6398bf3a8328SStefano Zampini const PetscInt *idxs_V,*idxs_all; 6399bf3a8328SStefano Zampini PetscInt i,n_V; 6400bf3a8328SStefano Zampini 6401b087196eSStefano Zampini ierr = MatZeroRowsColumnsIS(S_new,is_V_Sall,1.,NULL,NULL);CHKERRQ(ierr); 6402b087196eSStefano Zampini ierr = ISGetLocalSize(is_V_Sall,&n_V);CHKERRQ(ierr); 6403b087196eSStefano Zampini ierr = ISGetIndices(is_V_Sall,&idxs_V);CHKERRQ(ierr); 6404b087196eSStefano Zampini ierr = ISGetIndices(sub_schurs->is_Ej_all,&idxs_all);CHKERRQ(ierr); 6405b087196eSStefano Zampini 
ierr = VecGetArrayRead(pcis->D,&array);CHKERRQ(ierr); 6406b087196eSStefano Zampini for (i=0;i<n_V;i++) { 6407b087196eSStefano Zampini PetscScalar val; 6408b087196eSStefano Zampini PetscInt idx; 6409b087196eSStefano Zampini 6410b087196eSStefano Zampini idx = idxs_V[i]; 6411b087196eSStefano Zampini val = array[idxs_all[idxs_V[i]]]; 6412b087196eSStefano Zampini ierr = MatSetValue(S_new,idx,idx,val,INSERT_VALUES);CHKERRQ(ierr); 6413b087196eSStefano Zampini } 6414b087196eSStefano Zampini ierr = MatAssemblyBegin(S_new,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 6415b087196eSStefano Zampini ierr = MatAssemblyEnd(S_new,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 6416bf3a8328SStefano Zampini ierr = VecRestoreArrayRead(pcis->D,&array);CHKERRQ(ierr); 6417bf3a8328SStefano Zampini ierr = ISRestoreIndices(sub_schurs->is_Ej_all,&idxs_all);CHKERRQ(ierr); 6418bf3a8328SStefano Zampini ierr = ISRestoreIndices(is_V_Sall,&idxs_V);CHKERRQ(ierr); 6419bf3a8328SStefano Zampini } 6420ac632422SStefano Zampini sub_schurs->S_Ej_all = S_new; 6421ac632422SStefano Zampini ierr = MatDestroy(&S_new);CHKERRQ(ierr); 6422ac632422SStefano Zampini if (sub_schurs->sum_S_Ej_all) { 6423ac632422SStefano Zampini ierr = MatPtAP(sub_schurs->sum_S_Ej_all,tmat,MAT_INITIAL_MATRIX,1.0,&S_new);CHKERRQ(ierr); 6424b96c3477SStefano Zampini ierr = MatDestroy(&sub_schurs->sum_S_Ej_all);CHKERRQ(ierr); 6425ac632422SStefano Zampini ierr = PetscObjectReference((PetscObject)S_new);CHKERRQ(ierr); 6426bf3a8328SStefano Zampini if (pcbddc->deluxe_zerorows) { 6427b087196eSStefano Zampini ierr = MatZeroRowsColumnsIS(S_new,is_V_Sall,1.,NULL,NULL);CHKERRQ(ierr); 6428bf3a8328SStefano Zampini } 6429ac632422SStefano Zampini sub_schurs->sum_S_Ej_all = S_new; 6430ac632422SStefano Zampini ierr = MatDestroy(&S_new);CHKERRQ(ierr); 6431ac632422SStefano Zampini } 6432b087196eSStefano Zampini ierr = ISDestroy(&is_V_Sall);CHKERRQ(ierr); 643388c03ad3SStefano Zampini ierr = MatDestroy(&tmat);CHKERRQ(ierr); 6434b96c3477SStefano Zampini } 6435c9db6a07SStefano 
Zampini /* destroy any change of basis context in sub_schurs */ 6436b334f244SStefano Zampini if (sub_schurs && sub_schurs->change) { 6437c9db6a07SStefano Zampini PetscInt i; 6438c9db6a07SStefano Zampini 6439c9db6a07SStefano Zampini for (i=0;i<sub_schurs->n_subs;i++) { 6440c9db6a07SStefano Zampini ierr = KSPDestroy(&sub_schurs->change[i]);CHKERRQ(ierr); 6441c9db6a07SStefano Zampini } 6442c9db6a07SStefano Zampini ierr = PetscFree(sub_schurs->change);CHKERRQ(ierr); 6443c9db6a07SStefano Zampini } 6444b96c3477SStefano Zampini } 644516909a7fSStefano Zampini if (pcbddc->switch_static) { /* need to save the local change */ 644616909a7fSStefano Zampini pcbddc->switch_static_change = localChangeOfBasisMatrix; 644716909a7fSStefano Zampini } else { 6448906d46d4SStefano Zampini ierr = MatDestroy(&localChangeOfBasisMatrix);CHKERRQ(ierr); 644916909a7fSStefano Zampini } 64501dd7afcfSStefano Zampini /* determine if any process has changed the pressures locally */ 645127b6a85dSStefano Zampini pcbddc->change_interior = pcbddc->benign_have_null; 645272b8c272SStefano Zampini } else { /* fake change (get back change of basis into ConstraintMatrix and info on qr) */ 645372b8c272SStefano Zampini ierr = MatDestroy(&pcbddc->ConstraintMatrix);CHKERRQ(ierr); 645472b8c272SStefano Zampini pcbddc->ConstraintMatrix = localChangeOfBasisMatrix; 645572b8c272SStefano Zampini pcbddc->use_qr_single = qr_needed; 645672b8c272SStefano Zampini } 64571dd7afcfSStefano Zampini } else if (pcbddc->user_ChangeOfBasisMatrix || pcbddc->benign_saddle_point) { 645827b6a85dSStefano Zampini if (!pcbddc->benign_have_null && pcbddc->user_ChangeOfBasisMatrix) { 6459b9b85e73SStefano Zampini ierr = PetscObjectReference((PetscObject)pcbddc->user_ChangeOfBasisMatrix);CHKERRQ(ierr); 6460b9b85e73SStefano Zampini pcbddc->ChangeOfBasisMatrix = pcbddc->user_ChangeOfBasisMatrix; 6461906d46d4SStefano Zampini } else { 64621dd7afcfSStefano Zampini Mat benign_global = NULL; 646327b6a85dSStefano Zampini if (pcbddc->benign_have_null) { 
64641dd7afcfSStefano Zampini Mat tmat; 64651dd7afcfSStefano Zampini 64661dd7afcfSStefano Zampini pcbddc->change_interior = PETSC_TRUE; 64671dd7afcfSStefano Zampini ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr); 64681dd7afcfSStefano Zampini ierr = VecSet(pcis->vec1_N,1.0);CHKERRQ(ierr); 64691dd7afcfSStefano Zampini ierr = VecScatterBegin(matis->rctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 64701dd7afcfSStefano Zampini ierr = VecScatterEnd(matis->rctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 64711dd7afcfSStefano Zampini ierr = VecReciprocal(pcis->vec1_global);CHKERRQ(ierr); 64721dd7afcfSStefano Zampini ierr = VecScatterBegin(matis->rctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 64731dd7afcfSStefano Zampini ierr = VecScatterEnd(matis->rctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 64741dd7afcfSStefano Zampini ierr = MatDuplicate(pc->pmat,MAT_DO_NOT_COPY_VALUES,&tmat);CHKERRQ(ierr); 64751dd7afcfSStefano Zampini if (pcbddc->benign_change) { 64761dd7afcfSStefano Zampini Mat M; 64771dd7afcfSStefano Zampini 64781dd7afcfSStefano Zampini ierr = MatDuplicate(pcbddc->benign_change,MAT_COPY_VALUES,&M);CHKERRQ(ierr); 64791dd7afcfSStefano Zampini ierr = MatDiagonalScale(M,pcis->vec1_N,NULL);CHKERRQ(ierr); 64801dd7afcfSStefano Zampini ierr = MatISSetLocalMat(tmat,M);CHKERRQ(ierr); 64811dd7afcfSStefano Zampini ierr = MatDestroy(&M);CHKERRQ(ierr); 6482906d46d4SStefano Zampini } else { 64831dd7afcfSStefano Zampini Mat eye; 64841dd7afcfSStefano Zampini PetscScalar *array; 64851dd7afcfSStefano Zampini 64861dd7afcfSStefano Zampini ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 64871dd7afcfSStefano Zampini ierr = MatCreateSeqAIJ(PETSC_COMM_SELF,pcis->n,pcis->n,1,NULL,&eye);CHKERRQ(ierr); 64881dd7afcfSStefano Zampini for (i=0;i<pcis->n;i++) { 64891dd7afcfSStefano Zampini ierr = MatSetValue(eye,i,i,array[i],INSERT_VALUES);CHKERRQ(ierr); 
6490906d46d4SStefano Zampini } 64911dd7afcfSStefano Zampini ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 64921dd7afcfSStefano Zampini ierr = MatAssemblyBegin(eye,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 64931dd7afcfSStefano Zampini ierr = MatAssemblyEnd(eye,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 64941dd7afcfSStefano Zampini ierr = MatISSetLocalMat(tmat,eye);CHKERRQ(ierr); 64951dd7afcfSStefano Zampini ierr = MatDestroy(&eye);CHKERRQ(ierr); 64961dd7afcfSStefano Zampini } 64971dd7afcfSStefano Zampini ierr = MatISGetMPIXAIJ(tmat,MAT_INITIAL_MATRIX,&benign_global);CHKERRQ(ierr); 64981dd7afcfSStefano Zampini ierr = MatDestroy(&tmat);CHKERRQ(ierr); 64991dd7afcfSStefano Zampini } 65001dd7afcfSStefano Zampini if (pcbddc->user_ChangeOfBasisMatrix) { 65011dd7afcfSStefano Zampini ierr = MatMatMult(pcbddc->user_ChangeOfBasisMatrix,benign_global,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&pcbddc->ChangeOfBasisMatrix);CHKERRQ(ierr); 65021dd7afcfSStefano Zampini ierr = MatDestroy(&benign_global);CHKERRQ(ierr); 650327b6a85dSStefano Zampini } else if (pcbddc->benign_have_null) { 65041dd7afcfSStefano Zampini pcbddc->ChangeOfBasisMatrix = benign_global; 65051dd7afcfSStefano Zampini } 65061dd7afcfSStefano Zampini } 650716909a7fSStefano Zampini if (pcbddc->switch_static && pcbddc->ChangeOfBasisMatrix) { /* need to save the local change */ 650816909a7fSStefano Zampini IS is_global; 650916909a7fSStefano Zampini const PetscInt *gidxs; 651016909a7fSStefano Zampini 651116909a7fSStefano Zampini ierr = ISLocalToGlobalMappingGetIndices(pc->pmat->rmap->mapping,&gidxs);CHKERRQ(ierr); 651216909a7fSStefano Zampini ierr = ISCreateGeneral(PetscObjectComm((PetscObject)pc),pcis->n,gidxs,PETSC_COPY_VALUES,&is_global);CHKERRQ(ierr); 651316909a7fSStefano Zampini ierr = ISLocalToGlobalMappingRestoreIndices(pc->pmat->rmap->mapping,&gidxs);CHKERRQ(ierr); 65147dae84e0SHong Zhang ierr = MatCreateSubMatrixUnsorted(pcbddc->ChangeOfBasisMatrix,is_global,is_global,&pcbddc->switch_static_change);CHKERRQ(ierr); 
651516909a7fSStefano Zampini ierr = ISDestroy(&is_global);CHKERRQ(ierr); 651616909a7fSStefano Zampini } 65171dd7afcfSStefano Zampini } 65181dd7afcfSStefano Zampini if (!pcbddc->fake_change && pcbddc->ChangeOfBasisMatrix && !pcbddc->work_change) { 65191dd7afcfSStefano Zampini ierr = VecDuplicate(pcis->vec1_global,&pcbddc->work_change);CHKERRQ(ierr); 6520b9b85e73SStefano Zampini } 6521a717540cSStefano Zampini 652272b8c272SStefano Zampini if (!pcbddc->fake_change) { 65234f1b2e48SStefano Zampini /* add pressure dofs to set of primal nodes for numbering purposes */ 65244f1b2e48SStefano Zampini for (i=0;i<pcbddc->benign_n;i++) { 65254f1b2e48SStefano Zampini pcbddc->local_primal_ref_node[pcbddc->local_primal_size_cc] = pcbddc->benign_p0_lidx[i]; 65264f1b2e48SStefano Zampini pcbddc->primal_indices_local_idxs[pcbddc->local_primal_size] = pcbddc->benign_p0_lidx[i]; 6527019a44ceSStefano Zampini pcbddc->local_primal_ref_mult[pcbddc->local_primal_size_cc] = 1; 6528019a44ceSStefano Zampini pcbddc->local_primal_size_cc++; 6529019a44ceSStefano Zampini pcbddc->local_primal_size++; 6530019a44ceSStefano Zampini } 6531019a44ceSStefano Zampini 6532019a44ceSStefano Zampini /* check if a new primal space has been introduced (also take into account benign trick) */ 6533727cdba6SStefano Zampini pcbddc->new_primal_space_local = PETSC_TRUE; 6534727cdba6SStefano Zampini if (olocal_primal_size == pcbddc->local_primal_size) { 65359f47a83aSStefano Zampini ierr = PetscMemcmp(pcbddc->local_primal_ref_node,olocal_primal_ref_node,olocal_primal_size_cc*sizeof(PetscInt),&pcbddc->new_primal_space_local);CHKERRQ(ierr); 6536c1c8e736SStefano Zampini pcbddc->new_primal_space_local = (PetscBool)(!pcbddc->new_primal_space_local); 65370e6343abSStefano Zampini if (!pcbddc->new_primal_space_local) { 65389f47a83aSStefano Zampini ierr = PetscMemcmp(pcbddc->local_primal_ref_mult,olocal_primal_ref_mult,olocal_primal_size_cc*sizeof(PetscInt),&pcbddc->new_primal_space_local);CHKERRQ(ierr); 6539727cdba6SStefano 
Zampini pcbddc->new_primal_space_local = (PetscBool)(!pcbddc->new_primal_space_local); 6540727cdba6SStefano Zampini } 65410e6343abSStefano Zampini } 6542727cdba6SStefano Zampini /* new_primal_space will be used for numbering of coarse dofs, so it should be the same across all subdomains */ 6543b2566f29SBarry Smith ierr = MPIU_Allreduce(&pcbddc->new_primal_space_local,&pcbddc->new_primal_space,1,MPIU_BOOL,MPI_LOR,PetscObjectComm((PetscObject)pc));CHKERRQ(ierr); 654472b8c272SStefano Zampini } 654572b8c272SStefano Zampini ierr = PetscFree2(olocal_primal_ref_node,olocal_primal_ref_mult);CHKERRQ(ierr); 6546727cdba6SStefano Zampini 6547a717540cSStefano Zampini /* flush dbg viewer */ 6548b8ffe317SStefano Zampini if (pcbddc->dbg_flag) { 6549b8ffe317SStefano Zampini ierr = PetscViewerFlush(pcbddc->dbg_viewer);CHKERRQ(ierr); 6550b8ffe317SStefano Zampini } 6551a717540cSStefano Zampini 6552e310c8b4SStefano Zampini /* free workspace */ 6553a717540cSStefano Zampini ierr = PetscBTDestroy(&qr_needed_idx);CHKERRQ(ierr); 65544641a718SStefano Zampini ierr = PetscBTDestroy(&change_basis);CHKERRQ(ierr); 655508122e43SStefano Zampini if (!pcbddc->adaptive_selection) { 65569162d606SStefano Zampini ierr = PetscFree3(constraints_idxs_ptr,constraints_data_ptr,constraints_n);CHKERRQ(ierr); 65579162d606SStefano Zampini ierr = PetscFree3(constraints_data,constraints_idxs,constraints_idxs_B);CHKERRQ(ierr); 655808122e43SStefano Zampini } else { 65599162d606SStefano Zampini ierr = PetscFree5(pcbddc->adaptive_constraints_n, 65609162d606SStefano Zampini pcbddc->adaptive_constraints_idxs_ptr, 65619162d606SStefano Zampini pcbddc->adaptive_constraints_data_ptr, 656208122e43SStefano Zampini pcbddc->adaptive_constraints_idxs, 656308122e43SStefano Zampini pcbddc->adaptive_constraints_data);CHKERRQ(ierr); 65649162d606SStefano Zampini ierr = PetscFree(constraints_n);CHKERRQ(ierr); 65659162d606SStefano Zampini ierr = PetscFree(constraints_idxs_B);CHKERRQ(ierr); 656608122e43SStefano Zampini } 
6567674ae819SStefano Zampini PetscFunctionReturn(0); 6568674ae819SStefano Zampini } 6569674ae819SStefano Zampini 6570674ae819SStefano Zampini PetscErrorCode PCBDDCAnalyzeInterface(PC pc) 6571674ae819SStefano Zampini { 657271582508SStefano Zampini ISLocalToGlobalMapping map; 6573674ae819SStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 6574674ae819SStefano Zampini Mat_IS *matis = (Mat_IS*)pc->pmat->data; 657566da6bd7Sstefano_zampini PetscInt i,N; 657666da6bd7Sstefano_zampini PetscBool rcsr = PETSC_FALSE; 657766da6bd7Sstefano_zampini PetscErrorCode ierr; 6578674ae819SStefano Zampini 6579674ae819SStefano Zampini PetscFunctionBegin; 65808af8fcf9SStefano Zampini if (pcbddc->recompute_topography) { 6581b03ebc13SStefano Zampini pcbddc->graphanalyzed = PETSC_FALSE; 65828e61c736SStefano Zampini /* Reset previously computed graph */ 65838e61c736SStefano Zampini ierr = PCBDDCGraphReset(pcbddc->mat_graph);CHKERRQ(ierr); 6584674ae819SStefano Zampini /* Init local Graph struct */ 65857fb0e2dbSStefano Zampini ierr = MatGetSize(pc->pmat,&N,NULL);CHKERRQ(ierr); 658671582508SStefano Zampini ierr = MatGetLocalToGlobalMapping(pc->pmat,&map,NULL);CHKERRQ(ierr); 6587be12c134Sstefano_zampini ierr = PCBDDCGraphInit(pcbddc->mat_graph,map,N,pcbddc->graphmaxcount);CHKERRQ(ierr); 6588674ae819SStefano Zampini 65897a0e7b2cSstefano_zampini if (pcbddc->user_primal_vertices_local && !pcbddc->user_primal_vertices) { 65907a0e7b2cSstefano_zampini ierr = PCBDDCConsistencyCheckIS(pc,MPI_LOR,&pcbddc->user_primal_vertices_local);CHKERRQ(ierr); 65917a0e7b2cSstefano_zampini } 6592575ad6abSStefano Zampini /* Check validity of the csr graph passed in by the user */ 65939a962809SStefano Zampini if (pcbddc->mat_graph->nvtxs_csr && pcbddc->mat_graph->nvtxs_csr != pcbddc->mat_graph->nvtxs) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONG,"Invalid size of local CSR graph! 
Found %d, expected %d\n",pcbddc->mat_graph->nvtxs_csr,pcbddc->mat_graph->nvtxs); 65949577ea80SStefano Zampini 6595674ae819SStefano Zampini /* Set default CSR adjacency of local dofs if not provided by the user with PCBDDCSetLocalAdjacencyGraph */ 659666da6bd7Sstefano_zampini if (!pcbddc->mat_graph->xadj && pcbddc->use_local_adj) { 65974d379d7bSStefano Zampini PetscInt *xadj,*adjncy; 65984d379d7bSStefano Zampini PetscInt nvtxs; 6599e496cd5dSStefano Zampini PetscBool flg_row=PETSC_FALSE; 6600674ae819SStefano Zampini 66012fffb893SStefano Zampini ierr = MatGetRowIJ(matis->A,0,PETSC_TRUE,PETSC_FALSE,&nvtxs,(const PetscInt**)&xadj,(const PetscInt**)&adjncy,&flg_row);CHKERRQ(ierr); 66022fffb893SStefano Zampini if (flg_row) { 66034d379d7bSStefano Zampini ierr = PCBDDCSetLocalAdjacencyGraph(pc,nvtxs,xadj,adjncy,PETSC_COPY_VALUES);CHKERRQ(ierr); 6604b96c3477SStefano Zampini pcbddc->computed_rowadj = PETSC_TRUE; 66052fffb893SStefano Zampini } 66062fffb893SStefano Zampini ierr = MatRestoreRowIJ(matis->A,0,PETSC_TRUE,PETSC_FALSE,&nvtxs,(const PetscInt**)&xadj,(const PetscInt**)&adjncy,&flg_row);CHKERRQ(ierr); 660766da6bd7Sstefano_zampini rcsr = PETSC_TRUE; 6608674ae819SStefano Zampini } 66099b28b941SStefano Zampini if (pcbddc->dbg_flag) { 66109b28b941SStefano Zampini ierr = PetscViewerFlush(pcbddc->dbg_viewer);CHKERRQ(ierr); 6611674ae819SStefano Zampini } 6612674ae819SStefano Zampini 6613674ae819SStefano Zampini /* Setup of Graph */ 66144b2aedd3SStefano Zampini pcbddc->mat_graph->commsizelimit = 0; /* don't use the COMM_SELF variant of the graph */ 661514f95afaSStefano Zampini ierr = PCBDDCGraphSetUp(pcbddc->mat_graph,pcbddc->vertex_size,pcbddc->NeumannBoundariesLocal,pcbddc->DirichletBoundariesLocal,pcbddc->n_ISForDofsLocal,pcbddc->ISForDofsLocal,pcbddc->user_primal_vertices_local);CHKERRQ(ierr); 6616674ae819SStefano Zampini 66174f1b2e48SStefano Zampini /* attach info on disconnected subdomains if present */ 66184f1b2e48SStefano Zampini if (pcbddc->n_local_subs) { 
66194f1b2e48SStefano Zampini PetscInt *local_subs; 66204f1b2e48SStefano Zampini 66214f1b2e48SStefano Zampini ierr = PetscMalloc1(N,&local_subs);CHKERRQ(ierr); 66224f1b2e48SStefano Zampini for (i=0;i<pcbddc->n_local_subs;i++) { 66234f1b2e48SStefano Zampini const PetscInt *idxs; 66244f1b2e48SStefano Zampini PetscInt nl,j; 66254f1b2e48SStefano Zampini 66264f1b2e48SStefano Zampini ierr = ISGetLocalSize(pcbddc->local_subs[i],&nl);CHKERRQ(ierr); 66274f1b2e48SStefano Zampini ierr = ISGetIndices(pcbddc->local_subs[i],&idxs);CHKERRQ(ierr); 662871582508SStefano Zampini for (j=0;j<nl;j++) local_subs[idxs[j]] = i; 66294f1b2e48SStefano Zampini ierr = ISRestoreIndices(pcbddc->local_subs[i],&idxs);CHKERRQ(ierr); 66304f1b2e48SStefano Zampini } 66314f1b2e48SStefano Zampini pcbddc->mat_graph->n_local_subs = pcbddc->n_local_subs; 66324f1b2e48SStefano Zampini pcbddc->mat_graph->local_subs = local_subs; 66334f1b2e48SStefano Zampini } 66348af8fcf9SStefano Zampini } 66354f1b2e48SStefano Zampini 6636cac5312eSStefano Zampini if (!pcbddc->graphanalyzed) { 6637674ae819SStefano Zampini /* Graph's connected components analysis */ 6638674ae819SStefano Zampini ierr = PCBDDCGraphComputeConnectedComponents(pcbddc->mat_graph);CHKERRQ(ierr); 663971582508SStefano Zampini pcbddc->graphanalyzed = PETSC_TRUE; 66408af8fcf9SStefano Zampini } 664166da6bd7Sstefano_zampini if (rcsr) pcbddc->mat_graph->nvtxs_csr = 0; 6642674ae819SStefano Zampini PetscFunctionReturn(0); 6643674ae819SStefano Zampini } 6644674ae819SStefano Zampini 66459a7d3425SStefano Zampini PetscErrorCode PCBDDCOrthonormalizeVecs(PetscInt n, Vec vecs[]) 66469a7d3425SStefano Zampini { 66479a7d3425SStefano Zampini PetscInt i,j; 66489a7d3425SStefano Zampini PetscScalar *alphas; 66499a7d3425SStefano Zampini PetscErrorCode ierr; 66509a7d3425SStefano Zampini 66519a7d3425SStefano Zampini PetscFunctionBegin; 6652785e854fSJed Brown ierr = PetscMalloc1(n,&alphas);CHKERRQ(ierr); 66539a7d3425SStefano Zampini for (i=0;i<n;i++) { 66549a7d3425SStefano 
Zampini ierr = VecNormalize(vecs[i],NULL);CHKERRQ(ierr); 6655669cc0f4SStefano Zampini ierr = VecMDot(vecs[i],n-i-1,&vecs[i+1],alphas);CHKERRQ(ierr); 6656669cc0f4SStefano Zampini for (j=0;j<n-i-1;j++) alphas[j] = PetscConj(-alphas[j]); 6657669cc0f4SStefano Zampini ierr = VecMAXPY(vecs[j],n-i-1,alphas,vecs+i);CHKERRQ(ierr); 66589a7d3425SStefano Zampini } 66599a7d3425SStefano Zampini ierr = PetscFree(alphas);CHKERRQ(ierr); 66609a7d3425SStefano Zampini PetscFunctionReturn(0); 66619a7d3425SStefano Zampini } 66629a7d3425SStefano Zampini 6663bb360cb4SStefano Zampini PetscErrorCode PCBDDCMatISGetSubassemblingPattern(Mat mat, PetscInt *n_subdomains, PetscInt redprocs, IS* is_sends, PetscBool *have_void) 6664e7931f94SStefano Zampini { 666557de7509SStefano Zampini Mat A; 6666e7931f94SStefano Zampini PetscInt n_neighs,*neighs,*n_shared,**shared; 6667e7931f94SStefano Zampini PetscMPIInt size,rank,color; 666852e5ac9dSStefano Zampini PetscInt *xadj,*adjncy; 666952e5ac9dSStefano Zampini PetscInt *adjncy_wgt,*v_wgt,*ranks_send_to_idx; 6670bb360cb4SStefano Zampini PetscInt im_active,active_procs,N,n,i,j,threshold = 2; 667157de7509SStefano Zampini PetscInt void_procs,*procs_candidates = NULL; 667227b6a85dSStefano Zampini PetscInt xadj_count,*count; 667327b6a85dSStefano Zampini PetscBool ismatis,use_vwgt=PETSC_FALSE; 667427b6a85dSStefano Zampini PetscSubcomm psubcomm; 667527b6a85dSStefano Zampini MPI_Comm subcomm; 667652e5ac9dSStefano Zampini PetscErrorCode ierr; 6677a57a6d2fSStefano Zampini 6678e7931f94SStefano Zampini PetscFunctionBegin; 667957de7509SStefano Zampini PetscValidHeaderSpecific(mat,MAT_CLASSID,1); 668057de7509SStefano Zampini ierr = PetscObjectTypeCompare((PetscObject)mat,MATIS,&ismatis);CHKERRQ(ierr); 6681fbfcfee5SBarry Smith if (!ismatis) SETERRQ1(PetscObjectComm((PetscObject)mat),PETSC_ERR_SUP,"Cannot use %s on a matrix object which is not of type MATIS",PETSC_FUNCTION_NAME); 668257de7509SStefano Zampini PetscValidLogicalCollectiveInt(mat,*n_subdomains,2); 
668357de7509SStefano Zampini PetscValidLogicalCollectiveInt(mat,redprocs,3); 668457de7509SStefano Zampini if (*n_subdomains <=0) SETERRQ1(PetscObjectComm((PetscObject)mat),PETSC_ERR_ARG_WRONG,"Invalid number of subdomains requested %d\n",*n_subdomains); 668557de7509SStefano Zampini 668657de7509SStefano Zampini if (have_void) *have_void = PETSC_FALSE; 668757de7509SStefano Zampini ierr = MPI_Comm_size(PetscObjectComm((PetscObject)mat),&size);CHKERRQ(ierr); 668857de7509SStefano Zampini ierr = MPI_Comm_rank(PetscObjectComm((PetscObject)mat),&rank);CHKERRQ(ierr); 668957de7509SStefano Zampini ierr = MatISGetLocalMat(mat,&A);CHKERRQ(ierr); 669057de7509SStefano Zampini ierr = MatGetLocalSize(A,&n,NULL);CHKERRQ(ierr); 6691bb360cb4SStefano Zampini im_active = !!n; 669257de7509SStefano Zampini ierr = MPIU_Allreduce(&im_active,&active_procs,1,MPIU_INT,MPI_SUM,PetscObjectComm((PetscObject)mat));CHKERRQ(ierr); 669357de7509SStefano Zampini void_procs = size - active_procs; 669457de7509SStefano Zampini /* get ranks of of non-active processes in mat communicator */ 669557de7509SStefano Zampini if (void_procs) { 669657de7509SStefano Zampini PetscInt ncand; 669757de7509SStefano Zampini 669857de7509SStefano Zampini if (have_void) *have_void = PETSC_TRUE; 669957de7509SStefano Zampini ierr = PetscMalloc1(size,&procs_candidates);CHKERRQ(ierr); 670057de7509SStefano Zampini ierr = MPI_Allgather(&im_active,1,MPIU_INT,procs_candidates,1,MPIU_INT,PetscObjectComm((PetscObject)mat));CHKERRQ(ierr); 670157de7509SStefano Zampini for (i=0,ncand=0;i<size;i++) { 670257de7509SStefano Zampini if (!procs_candidates[i]) { 670357de7509SStefano Zampini procs_candidates[ncand++] = i; 670457de7509SStefano Zampini } 670557de7509SStefano Zampini } 670657de7509SStefano Zampini /* force n_subdomains to be not greater that the number of non-active processes */ 670757de7509SStefano Zampini *n_subdomains = PetscMin(void_procs,*n_subdomains); 670857de7509SStefano Zampini } 670957de7509SStefano Zampini 
6710bb360cb4SStefano Zampini /* number of subdomains requested greater than active processes or matrix size -> just shift the matrix 671114f0bfb9SStefano Zampini number of subdomains requested 1 -> send to master or first candidate in voids */ 6712bb360cb4SStefano Zampini ierr = MatGetSize(mat,&N,NULL);CHKERRQ(ierr); 6713bb360cb4SStefano Zampini if (active_procs < *n_subdomains || *n_subdomains == 1 || N <= *n_subdomains) { 671414f0bfb9SStefano Zampini PetscInt issize,isidx,dest; 671514f0bfb9SStefano Zampini if (*n_subdomains == 1) dest = 0; 671614f0bfb9SStefano Zampini else dest = rank; 671757de7509SStefano Zampini if (im_active) { 671857de7509SStefano Zampini issize = 1; 671957de7509SStefano Zampini if (procs_candidates) { /* shift the pattern on non-active candidates (if any) */ 672014f0bfb9SStefano Zampini isidx = procs_candidates[dest]; 672157de7509SStefano Zampini } else { 672214f0bfb9SStefano Zampini isidx = dest; 672357de7509SStefano Zampini } 672457de7509SStefano Zampini } else { 672557de7509SStefano Zampini issize = 0; 672657de7509SStefano Zampini isidx = -1; 672757de7509SStefano Zampini } 6728bb360cb4SStefano Zampini if (*n_subdomains != 1) *n_subdomains = active_procs; 672957de7509SStefano Zampini ierr = ISCreateGeneral(PetscObjectComm((PetscObject)mat),issize,&isidx,PETSC_COPY_VALUES,is_sends);CHKERRQ(ierr); 6730daf8a457SStefano Zampini ierr = PetscFree(procs_candidates);CHKERRQ(ierr); 673157de7509SStefano Zampini PetscFunctionReturn(0); 673257de7509SStefano Zampini } 6733c5929fdfSBarry Smith ierr = PetscOptionsGetBool(NULL,NULL,"-matis_partitioning_use_vwgt",&use_vwgt,NULL);CHKERRQ(ierr); 6734c5929fdfSBarry Smith ierr = PetscOptionsGetInt(NULL,NULL,"-matis_partitioning_threshold",&threshold,NULL);CHKERRQ(ierr); 673527b6a85dSStefano Zampini threshold = PetscMax(threshold,2); 6736e7931f94SStefano Zampini 6737e7931f94SStefano Zampini /* Get info on mapping */ 67383bbff08aSStefano Zampini ierr = 
ISLocalToGlobalMappingGetInfo(mat->rmap->mapping,&n_neighs,&neighs,&n_shared,&shared);CHKERRQ(ierr); 6739e7931f94SStefano Zampini 6740e7931f94SStefano Zampini /* build local CSR graph of subdomains' connectivity */ 6741785e854fSJed Brown ierr = PetscMalloc1(2,&xadj);CHKERRQ(ierr); 6742e7931f94SStefano Zampini xadj[0] = 0; 6743e7931f94SStefano Zampini xadj[1] = PetscMax(n_neighs-1,0); 6744785e854fSJed Brown ierr = PetscMalloc1(xadj[1],&adjncy);CHKERRQ(ierr); 6745785e854fSJed Brown ierr = PetscMalloc1(xadj[1],&adjncy_wgt);CHKERRQ(ierr); 6746bb360cb4SStefano Zampini ierr = PetscCalloc1(n,&count);CHKERRQ(ierr); 674727b6a85dSStefano Zampini for (i=1;i<n_neighs;i++) 674827b6a85dSStefano Zampini for (j=0;j<n_shared[i];j++) 674927b6a85dSStefano Zampini count[shared[i][j]] += 1; 6750e7931f94SStefano Zampini 675127b6a85dSStefano Zampini xadj_count = 0; 67522b510759SStefano Zampini for (i=1;i<n_neighs;i++) { 675327b6a85dSStefano Zampini for (j=0;j<n_shared[i];j++) { 675427b6a85dSStefano Zampini if (count[shared[i][j]] < threshold) { 6755d023bfaeSStefano Zampini adjncy[xadj_count] = neighs[i]; 6756d023bfaeSStefano Zampini adjncy_wgt[xadj_count] = n_shared[i]; 6757d023bfaeSStefano Zampini xadj_count++; 675827b6a85dSStefano Zampini break; 675927b6a85dSStefano Zampini } 6760e7931f94SStefano Zampini } 6761e7931f94SStefano Zampini } 6762d023bfaeSStefano Zampini xadj[1] = xadj_count; 676327b6a85dSStefano Zampini ierr = PetscFree(count);CHKERRQ(ierr); 67643bbff08aSStefano Zampini ierr = ISLocalToGlobalMappingRestoreInfo(mat->rmap->mapping,&n_neighs,&neighs,&n_shared,&shared);CHKERRQ(ierr); 6765e7931f94SStefano Zampini ierr = PetscSortIntWithArray(xadj[1],adjncy,adjncy_wgt);CHKERRQ(ierr); 6766e7931f94SStefano Zampini 67673837a79fSStefano Zampini ierr = PetscMalloc1(1,&ranks_send_to_idx);CHKERRQ(ierr); 6768e7931f94SStefano Zampini 676927b6a85dSStefano Zampini /* Restrict work on active processes only */ 677027b6a85dSStefano Zampini ierr = 
PetscMPIIntCast(im_active,&color);CHKERRQ(ierr); 677127b6a85dSStefano Zampini if (void_procs) { 677227b6a85dSStefano Zampini ierr = PetscSubcommCreate(PetscObjectComm((PetscObject)mat),&psubcomm);CHKERRQ(ierr); 677327b6a85dSStefano Zampini ierr = PetscSubcommSetNumber(psubcomm,2);CHKERRQ(ierr); /* 2 groups, active process and not active processes */ 677427b6a85dSStefano Zampini ierr = PetscSubcommSetTypeGeneral(psubcomm,color,rank);CHKERRQ(ierr); 677527b6a85dSStefano Zampini subcomm = PetscSubcommChild(psubcomm); 677627b6a85dSStefano Zampini } else { 677727b6a85dSStefano Zampini psubcomm = NULL; 677827b6a85dSStefano Zampini subcomm = PetscObjectComm((PetscObject)mat); 677927b6a85dSStefano Zampini } 678027b6a85dSStefano Zampini 678127b6a85dSStefano Zampini v_wgt = NULL; 678227b6a85dSStefano Zampini if (!color) { 6783e7931f94SStefano Zampini ierr = PetscFree(xadj);CHKERRQ(ierr); 6784e7931f94SStefano Zampini ierr = PetscFree(adjncy);CHKERRQ(ierr); 6785e7931f94SStefano Zampini ierr = PetscFree(adjncy_wgt);CHKERRQ(ierr); 6786c8587f34SStefano Zampini } else { 678752e5ac9dSStefano Zampini Mat subdomain_adj; 678852e5ac9dSStefano Zampini IS new_ranks,new_ranks_contig; 678952e5ac9dSStefano Zampini MatPartitioning partitioner; 679027b6a85dSStefano Zampini PetscInt rstart=0,rend=0; 679152e5ac9dSStefano Zampini PetscInt *is_indices,*oldranks; 679257de7509SStefano Zampini PetscMPIInt size; 6793b0c7d250SStefano Zampini PetscBool aggregate; 6794b0c7d250SStefano Zampini 679527b6a85dSStefano Zampini ierr = MPI_Comm_size(subcomm,&size);CHKERRQ(ierr); 679627b6a85dSStefano Zampini if (void_procs) { 679727b6a85dSStefano Zampini PetscInt prank = rank; 6798785e854fSJed Brown ierr = PetscMalloc1(size,&oldranks);CHKERRQ(ierr); 679927b6a85dSStefano Zampini ierr = MPI_Allgather(&prank,1,MPIU_INT,oldranks,1,MPIU_INT,subcomm);CHKERRQ(ierr); 6800e7931f94SStefano Zampini for (i=0;i<xadj[1];i++) { 6801e7931f94SStefano Zampini ierr = PetscFindInt(adjncy[i],size,oldranks,&adjncy[i]);CHKERRQ(ierr); 
6802c8587f34SStefano Zampini } 6803e7931f94SStefano Zampini ierr = PetscSortIntWithArray(xadj[1],adjncy,adjncy_wgt);CHKERRQ(ierr); 680427b6a85dSStefano Zampini } else { 680527b6a85dSStefano Zampini oldranks = NULL; 680627b6a85dSStefano Zampini } 6807b0c7d250SStefano Zampini aggregate = ((redprocs > 0 && redprocs < size) ? PETSC_TRUE : PETSC_FALSE); 680827b6a85dSStefano Zampini if (aggregate) { /* TODO: all this part could be made more efficient */ 6809b0c7d250SStefano Zampini PetscInt lrows,row,ncols,*cols; 6810b0c7d250SStefano Zampini PetscMPIInt nrank; 6811b0c7d250SStefano Zampini PetscScalar *vals; 6812b0c7d250SStefano Zampini 681327b6a85dSStefano Zampini ierr = MPI_Comm_rank(subcomm,&nrank);CHKERRQ(ierr); 6814b0c7d250SStefano Zampini lrows = 0; 6815b0c7d250SStefano Zampini if (nrank<redprocs) { 6816b0c7d250SStefano Zampini lrows = size/redprocs; 6817b0c7d250SStefano Zampini if (nrank<size%redprocs) lrows++; 6818b0c7d250SStefano Zampini } 681927b6a85dSStefano Zampini ierr = MatCreateAIJ(subcomm,lrows,lrows,size,size,50,NULL,50,NULL,&subdomain_adj);CHKERRQ(ierr); 6820b0c7d250SStefano Zampini ierr = MatGetOwnershipRange(subdomain_adj,&rstart,&rend);CHKERRQ(ierr); 6821b0c7d250SStefano Zampini ierr = MatSetOption(subdomain_adj,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_FALSE);CHKERRQ(ierr); 6822b0c7d250SStefano Zampini ierr = MatSetOption(subdomain_adj,MAT_NEW_NONZERO_ALLOCATION_ERR,PETSC_FALSE);CHKERRQ(ierr); 6823b0c7d250SStefano Zampini row = nrank; 6824b0c7d250SStefano Zampini ncols = xadj[1]-xadj[0]; 6825b0c7d250SStefano Zampini cols = adjncy; 6826b0c7d250SStefano Zampini ierr = PetscMalloc1(ncols,&vals);CHKERRQ(ierr); 6827b0c7d250SStefano Zampini for (i=0;i<ncols;i++) vals[i] = adjncy_wgt[i]; 6828b0c7d250SStefano Zampini ierr = MatSetValues(subdomain_adj,1,&row,ncols,cols,vals,INSERT_VALUES);CHKERRQ(ierr); 6829b0c7d250SStefano Zampini ierr = MatAssemblyBegin(subdomain_adj,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 6830b0c7d250SStefano Zampini ierr = 
MatAssemblyEnd(subdomain_adj,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 683152e5ac9dSStefano Zampini ierr = PetscFree(xadj);CHKERRQ(ierr); 683252e5ac9dSStefano Zampini ierr = PetscFree(adjncy);CHKERRQ(ierr); 683352e5ac9dSStefano Zampini ierr = PetscFree(adjncy_wgt);CHKERRQ(ierr); 6834b0c7d250SStefano Zampini ierr = PetscFree(vals);CHKERRQ(ierr); 683527b6a85dSStefano Zampini if (use_vwgt) { 683627b6a85dSStefano Zampini Vec v; 683727b6a85dSStefano Zampini const PetscScalar *array; 683827b6a85dSStefano Zampini PetscInt nl; 683927b6a85dSStefano Zampini 684027b6a85dSStefano Zampini ierr = MatCreateVecs(subdomain_adj,&v,NULL);CHKERRQ(ierr); 6841bb360cb4SStefano Zampini ierr = VecSetValue(v,row,(PetscScalar)n,INSERT_VALUES);CHKERRQ(ierr); 684227b6a85dSStefano Zampini ierr = VecAssemblyBegin(v);CHKERRQ(ierr); 684327b6a85dSStefano Zampini ierr = VecAssemblyEnd(v);CHKERRQ(ierr); 684427b6a85dSStefano Zampini ierr = VecGetLocalSize(v,&nl);CHKERRQ(ierr); 684527b6a85dSStefano Zampini ierr = VecGetArrayRead(v,&array);CHKERRQ(ierr); 684627b6a85dSStefano Zampini ierr = PetscMalloc1(nl,&v_wgt);CHKERRQ(ierr); 684722db5ddcSStefano Zampini for (i=0;i<nl;i++) v_wgt[i] = (PetscInt)PetscRealPart(array[i]); 684827b6a85dSStefano Zampini ierr = VecRestoreArrayRead(v,&array);CHKERRQ(ierr); 684927b6a85dSStefano Zampini ierr = VecDestroy(&v);CHKERRQ(ierr); 685027b6a85dSStefano Zampini } 6851b0c7d250SStefano Zampini } else { 685227b6a85dSStefano Zampini ierr = MatCreateMPIAdj(subcomm,1,(PetscInt)size,xadj,adjncy,adjncy_wgt,&subdomain_adj);CHKERRQ(ierr); 685327b6a85dSStefano Zampini if (use_vwgt) { 685427b6a85dSStefano Zampini ierr = PetscMalloc1(1,&v_wgt);CHKERRQ(ierr); 6855bb360cb4SStefano Zampini v_wgt[0] = n; 685627b6a85dSStefano Zampini } 6857b0c7d250SStefano Zampini } 685822b6e8a2SStefano Zampini /* ierr = MatView(subdomain_adj,0);CHKERRQ(ierr); */ 6859e7931f94SStefano Zampini 6860e7931f94SStefano Zampini /* Partition */ 686127b6a85dSStefano Zampini ierr = 
MatPartitioningCreate(subcomm,&partitioner);CHKERRQ(ierr); 6862e7931f94SStefano Zampini ierr = MatPartitioningSetAdjacency(partitioner,subdomain_adj);CHKERRQ(ierr); 686327b6a85dSStefano Zampini if (v_wgt) { 6864e7931f94SStefano Zampini ierr = MatPartitioningSetVertexWeights(partitioner,v_wgt);CHKERRQ(ierr); 6865c8587f34SStefano Zampini } 686657de7509SStefano Zampini *n_subdomains = PetscMin((PetscInt)size,*n_subdomains); 686757de7509SStefano Zampini ierr = MatPartitioningSetNParts(partitioner,*n_subdomains);CHKERRQ(ierr); 6868e7931f94SStefano Zampini ierr = MatPartitioningSetFromOptions(partitioner);CHKERRQ(ierr); 6869e7931f94SStefano Zampini ierr = MatPartitioningApply(partitioner,&new_ranks);CHKERRQ(ierr); 687022b6e8a2SStefano Zampini /* ierr = MatPartitioningView(partitioner,0);CHKERRQ(ierr); */ 6871e7931f94SStefano Zampini 687252e5ac9dSStefano Zampini /* renumber new_ranks to avoid "holes" in new set of processors */ 68736583bcc1SStefano Zampini ierr = ISRenumber(new_ranks,NULL,NULL,&new_ranks_contig);CHKERRQ(ierr); 687452e5ac9dSStefano Zampini ierr = ISDestroy(&new_ranks);CHKERRQ(ierr); 687552e5ac9dSStefano Zampini ierr = ISGetIndices(new_ranks_contig,(const PetscInt**)&is_indices);CHKERRQ(ierr); 687657de7509SStefano Zampini if (!aggregate) { 687757de7509SStefano Zampini if (procs_candidates) { /* shift the pattern on non-active candidates (if any) */ 687827b6a85dSStefano Zampini #if defined(PETSC_USE_DEBUG) 687927b6a85dSStefano Zampini if (!oldranks) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"This should not happen"); 688027b6a85dSStefano Zampini #endif 688157de7509SStefano Zampini ranks_send_to_idx[0] = procs_candidates[oldranks[is_indices[0]]]; 688227b6a85dSStefano Zampini } else if (oldranks) { 6883b0c7d250SStefano Zampini ranks_send_to_idx[0] = oldranks[is_indices[0]]; 688427b6a85dSStefano Zampini } else { 688527b6a85dSStefano Zampini ranks_send_to_idx[0] = is_indices[0]; 688657de7509SStefano Zampini } 688728143c3dSStefano Zampini } else { 68887fb8a5e4SKarl 
Rupp PetscInt idx = 0; 6889b0c7d250SStefano Zampini PetscMPIInt tag; 6890b0c7d250SStefano Zampini MPI_Request *reqs; 6891b0c7d250SStefano Zampini 6892b0c7d250SStefano Zampini ierr = PetscObjectGetNewTag((PetscObject)subdomain_adj,&tag);CHKERRQ(ierr); 6893b0c7d250SStefano Zampini ierr = PetscMalloc1(rend-rstart,&reqs);CHKERRQ(ierr); 6894b0c7d250SStefano Zampini for (i=rstart;i<rend;i++) { 689527b6a85dSStefano Zampini ierr = MPI_Isend(is_indices+i-rstart,1,MPIU_INT,i,tag,subcomm,&reqs[i-rstart]);CHKERRQ(ierr); 689628143c3dSStefano Zampini } 68977fb8a5e4SKarl Rupp ierr = MPI_Recv(&idx,1,MPIU_INT,MPI_ANY_SOURCE,tag,subcomm,MPI_STATUS_IGNORE);CHKERRQ(ierr); 6898b0c7d250SStefano Zampini ierr = MPI_Waitall(rend-rstart,reqs,MPI_STATUSES_IGNORE);CHKERRQ(ierr); 6899b0c7d250SStefano Zampini ierr = PetscFree(reqs);CHKERRQ(ierr); 690057de7509SStefano Zampini if (procs_candidates) { /* shift the pattern on non-active candidates (if any) */ 690127b6a85dSStefano Zampini #if defined(PETSC_USE_DEBUG) 690227b6a85dSStefano Zampini if (!oldranks) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"This should not happen"); 690327b6a85dSStefano Zampini #endif 69047fb8a5e4SKarl Rupp ranks_send_to_idx[0] = procs_candidates[oldranks[idx]]; 690527b6a85dSStefano Zampini } else if (oldranks) { 69067fb8a5e4SKarl Rupp ranks_send_to_idx[0] = oldranks[idx]; 690727b6a85dSStefano Zampini } else { 69087fb8a5e4SKarl Rupp ranks_send_to_idx[0] = idx; 6909e7931f94SStefano Zampini } 691057de7509SStefano Zampini } 691152e5ac9dSStefano Zampini ierr = ISRestoreIndices(new_ranks_contig,(const PetscInt**)&is_indices);CHKERRQ(ierr); 6912e7931f94SStefano Zampini /* clean up */ 6913e7931f94SStefano Zampini ierr = PetscFree(oldranks);CHKERRQ(ierr); 691452e5ac9dSStefano Zampini ierr = ISDestroy(&new_ranks_contig);CHKERRQ(ierr); 6915e7931f94SStefano Zampini ierr = MatDestroy(&subdomain_adj);CHKERRQ(ierr); 6916e7931f94SStefano Zampini ierr = MatPartitioningDestroy(&partitioner);CHKERRQ(ierr); 6917e7931f94SStefano Zampini } 
691827b6a85dSStefano Zampini ierr = PetscSubcommDestroy(&psubcomm);CHKERRQ(ierr); 691957de7509SStefano Zampini ierr = PetscFree(procs_candidates);CHKERRQ(ierr); 6920e7931f94SStefano Zampini 6921e7931f94SStefano Zampini /* assemble parallel IS for sends */ 6922e7931f94SStefano Zampini i = 1; 692327b6a85dSStefano Zampini if (!color) i=0; 692457de7509SStefano Zampini ierr = ISCreateGeneral(PetscObjectComm((PetscObject)mat),i,ranks_send_to_idx,PETSC_OWN_POINTER,is_sends);CHKERRQ(ierr); 6925e7931f94SStefano Zampini PetscFunctionReturn(0); 6926e7931f94SStefano Zampini } 6927e7931f94SStefano Zampini 6928e7931f94SStefano Zampini /* Private tag for the type of a local matrix: PCBDDCMatISSubassemble writes it (cast to PetscInt) as the first entry of the index send buffer, and the receiving side switches on it to choose the MatType of the new local matrix (the dense and AIJ tags both select MATSEQAIJ, the BAIJ tag MATSEQBAIJ, the SBAIJ tag MATSEQSBAIJ). */ typedef enum {MATDENSE_PRIVATE=0,MATAIJ_PRIVATE,MATBAIJ_PRIVATE,MATSBAIJ_PRIVATE}MatTypePrivate; 6929e7931f94SStefano Zampini 69301e0482f5SStefano Zampini PetscErrorCode PCBDDCMatISSubassemble(Mat mat, IS is_sends, PetscInt n_subdomains, PetscBool restrict_comm, PetscBool restrict_full, PetscBool reuse, Mat *mat_n, PetscInt nis, IS isarray[], PetscInt nvecs, Vec nnsp_vec[]) 6931e7931f94SStefano Zampini { 693270cf5478SStefano Zampini Mat local_mat; 6933e7931f94SStefano Zampini IS is_sends_internal; 69349d30be91SStefano Zampini PetscInt rows,cols,new_local_rows; 69351ae86dd6SStefano Zampini PetscInt i,bs,buf_size_idxs,buf_size_idxs_is,buf_size_vals,buf_size_vecs; 69369d30be91SStefano Zampini PetscBool ismatis,isdense,newisdense,destroy_mat; 6937e7931f94SStefano Zampini ISLocalToGlobalMapping l2gmap; 6938e7931f94SStefano Zampini PetscInt* l2gmap_indices; 6939e7931f94SStefano Zampini const PetscInt* is_indices; 6940e7931f94SStefano Zampini MatType new_local_type; 6941e7931f94SStefano Zampini /* buffers */ 6942e7931f94SStefano Zampini PetscInt *ptr_idxs,*send_buffer_idxs,*recv_buffer_idxs; 694328143c3dSStefano Zampini PetscInt *ptr_idxs_is,*send_buffer_idxs_is,*recv_buffer_idxs_is; 69449d30be91SStefano Zampini PetscInt *recv_buffer_idxs_local; 6945e7931f94SStefano Zampini PetscScalar *ptr_vals,*send_buffer_vals,*recv_buffer_vals; 69461ae86dd6SStefano
Zampini PetscScalar *ptr_vecs,*send_buffer_vecs,*recv_buffer_vecs; 6947e7931f94SStefano Zampini /* MPI */ 694828143c3dSStefano Zampini MPI_Comm comm,comm_n; 694928143c3dSStefano Zampini PetscSubcomm subcomm; 6950e7931f94SStefano Zampini PetscMPIInt n_sends,n_recvs,commsize; 695128143c3dSStefano Zampini PetscMPIInt *iflags,*ilengths_idxs,*ilengths_vals,*ilengths_idxs_is; 695228143c3dSStefano Zampini PetscMPIInt *onodes,*onodes_is,*olengths_idxs,*olengths_idxs_is,*olengths_vals; 69531ae86dd6SStefano Zampini PetscMPIInt len,tag_idxs,tag_idxs_is,tag_vals,tag_vecs,source_dest; 69541ae86dd6SStefano Zampini MPI_Request *send_req_idxs,*send_req_idxs_is,*send_req_vals,*send_req_vecs; 69551ae86dd6SStefano Zampini MPI_Request *recv_req_idxs,*recv_req_idxs_is,*recv_req_vals,*recv_req_vecs; 6956e7931f94SStefano Zampini PetscErrorCode ierr; 6957e7931f94SStefano Zampini 6958e7931f94SStefano Zampini PetscFunctionBegin; 695957de7509SStefano Zampini PetscValidHeaderSpecific(mat,MAT_CLASSID,1); 6960e7931f94SStefano Zampini ierr = PetscObjectTypeCompare((PetscObject)mat,MATIS,&ismatis);CHKERRQ(ierr); 6961fbfcfee5SBarry Smith if (!ismatis) SETERRQ1(PetscObjectComm((PetscObject)mat),PETSC_ERR_SUP,"Cannot use %s on a matrix object which is not of type MATIS",PETSC_FUNCTION_NAME); 696257de7509SStefano Zampini PetscValidLogicalCollectiveInt(mat,n_subdomains,3); 696357de7509SStefano Zampini PetscValidLogicalCollectiveBool(mat,restrict_comm,4); 696457de7509SStefano Zampini PetscValidLogicalCollectiveBool(mat,restrict_full,5); 696557de7509SStefano Zampini PetscValidLogicalCollectiveBool(mat,reuse,6); 696657de7509SStefano Zampini PetscValidLogicalCollectiveInt(mat,nis,8); 69671ae86dd6SStefano Zampini PetscValidLogicalCollectiveInt(mat,nvecs,10); 69681ae86dd6SStefano Zampini if (nvecs) { 69691ae86dd6SStefano Zampini if (nvecs > 1) SETERRQ(PetscObjectComm((PetscObject)mat),PETSC_ERR_SUP,"Just 1 vector supported"); 69701ae86dd6SStefano Zampini PetscValidHeaderSpecific(nnsp_vec[0],VEC_CLASSID,11); 
69711ae86dd6SStefano Zampini } 697257de7509SStefano Zampini /* further checks */ 6973e7931f94SStefano Zampini ierr = MatISGetLocalMat(mat,&local_mat);CHKERRQ(ierr); 6974e7931f94SStefano Zampini ierr = PetscObjectTypeCompare((PetscObject)local_mat,MATSEQDENSE,&isdense);CHKERRQ(ierr); 6975e7931f94SStefano Zampini if (!isdense) SETERRQ(PetscObjectComm((PetscObject)mat),PETSC_ERR_SUP,"Currently cannot subassemble MATIS when local matrix type is not of type SEQDENSE"); 6976e7931f94SStefano Zampini ierr = MatGetSize(local_mat,&rows,&cols);CHKERRQ(ierr); 6977e7931f94SStefano Zampini if (rows != cols) SETERRQ(PetscObjectComm((PetscObject)mat),PETSC_ERR_SUP,"Local MATIS matrices should be square"); 697857de7509SStefano Zampini if (reuse && *mat_n) { 697970cf5478SStefano Zampini PetscInt mrows,mcols,mnrows,mncols; 698057de7509SStefano Zampini PetscValidHeaderSpecific(*mat_n,MAT_CLASSID,7); 698170cf5478SStefano Zampini ierr = PetscObjectTypeCompare((PetscObject)*mat_n,MATIS,&ismatis);CHKERRQ(ierr); 698228143c3dSStefano Zampini if (!ismatis) SETERRQ(PetscObjectComm((PetscObject)*mat_n),PETSC_ERR_SUP,"Cannot reuse a matrix which is not of type MATIS"); 698370cf5478SStefano Zampini ierr = MatGetSize(mat,&mrows,&mcols);CHKERRQ(ierr); 698470cf5478SStefano Zampini ierr = MatGetSize(*mat_n,&mnrows,&mncols);CHKERRQ(ierr); 698570cf5478SStefano Zampini if (mrows != mnrows) SETERRQ2(PetscObjectComm((PetscObject)mat),PETSC_ERR_SUP,"Cannot reuse matrix! Wrong number of rows %D != %D",mrows,mnrows); 698670cf5478SStefano Zampini if (mcols != mncols) SETERRQ2(PetscObjectComm((PetscObject)mat),PETSC_ERR_SUP,"Cannot reuse matrix! 
Wrong number of cols %D != %D",mcols,mncols); 698770cf5478SStefano Zampini } 6988e7931f94SStefano Zampini ierr = MatGetBlockSize(local_mat,&bs);CHKERRQ(ierr); 6989e7931f94SStefano Zampini PetscValidLogicalCollectiveInt(mat,bs,0); 699057de7509SStefano Zampini 6991e7931f94SStefano Zampini /* prepare IS for sending if not provided */ 6992e7931f94SStefano Zampini if (!is_sends) { 699328143c3dSStefano Zampini if (!n_subdomains) SETERRQ(PetscObjectComm((PetscObject)mat),PETSC_ERR_SUP,"You should specify either an IS or a target number of subdomains"); 6994bb360cb4SStefano Zampini ierr = PCBDDCMatISGetSubassemblingPattern(mat,&n_subdomains,0,&is_sends_internal,NULL);CHKERRQ(ierr); 6995c8587f34SStefano Zampini } else { 6996e7931f94SStefano Zampini ierr = PetscObjectReference((PetscObject)is_sends);CHKERRQ(ierr); 6997e7931f94SStefano Zampini is_sends_internal = is_sends; 6998c8587f34SStefano Zampini } 6999e7931f94SStefano Zampini 7000e7931f94SStefano Zampini /* get comm */ 7001a316fed8SStefano Zampini ierr = PetscObjectGetComm((PetscObject)mat,&comm);CHKERRQ(ierr); 7002e7931f94SStefano Zampini 7003e7931f94SStefano Zampini /* compute number of sends */ 7004e7931f94SStefano Zampini ierr = ISGetLocalSize(is_sends_internal,&i);CHKERRQ(ierr); 7005e7931f94SStefano Zampini ierr = PetscMPIIntCast(i,&n_sends);CHKERRQ(ierr); 7006e7931f94SStefano Zampini 7007e7931f94SStefano Zampini /* compute number of receives */ 7008e7931f94SStefano Zampini ierr = MPI_Comm_size(comm,&commsize);CHKERRQ(ierr); 7009785e854fSJed Brown ierr = PetscMalloc1(commsize,&iflags);CHKERRQ(ierr); 7010e7931f94SStefano Zampini ierr = PetscMemzero(iflags,commsize*sizeof(*iflags));CHKERRQ(ierr); 7011e7931f94SStefano Zampini ierr = ISGetIndices(is_sends_internal,&is_indices);CHKERRQ(ierr); 7012e7931f94SStefano Zampini for (i=0;i<n_sends;i++) iflags[is_indices[i]] = 1; 7013e7931f94SStefano Zampini ierr = PetscGatherNumberOfMessages(comm,iflags,NULL,&n_recvs);CHKERRQ(ierr); 7014e7931f94SStefano Zampini ierr = 
PetscFree(iflags);CHKERRQ(ierr); 7015e7931f94SStefano Zampini 701628143c3dSStefano Zampini /* restrict comm if requested */ 701728143c3dSStefano Zampini subcomm = 0; 701828143c3dSStefano Zampini destroy_mat = PETSC_FALSE; 701928143c3dSStefano Zampini if (restrict_comm) { 7020779c1cceSStefano Zampini PetscMPIInt color,subcommsize; 7021779c1cceSStefano Zampini 702228143c3dSStefano Zampini color = 0; 702353a05cb3SStefano Zampini if (restrict_full) { 702453a05cb3SStefano Zampini if (!n_recvs) color = 1; /* processes not receiving anything will not partecipate in new comm (full restriction) */ 702553a05cb3SStefano Zampini } else { 702653a05cb3SStefano Zampini if (!n_recvs && n_sends) color = 1; /* just those processes that are sending but not receiving anything will not partecipate in new comm */ 702753a05cb3SStefano Zampini } 7028b2566f29SBarry Smith ierr = MPIU_Allreduce(&color,&subcommsize,1,MPI_INT,MPI_SUM,comm);CHKERRQ(ierr); 702928143c3dSStefano Zampini subcommsize = commsize - subcommsize; 703028143c3dSStefano Zampini /* check if reuse has been requested */ 703157de7509SStefano Zampini if (reuse) { 703228143c3dSStefano Zampini if (*mat_n) { 703328143c3dSStefano Zampini PetscMPIInt subcommsize2; 703428143c3dSStefano Zampini ierr = MPI_Comm_size(PetscObjectComm((PetscObject)*mat_n),&subcommsize2);CHKERRQ(ierr); 703528143c3dSStefano Zampini if (subcommsize != subcommsize2) SETERRQ2(PetscObjectComm((PetscObject)*mat_n),PETSC_ERR_PLIB,"Cannot reuse matrix! 
wrong subcomm size %d != %d",subcommsize,subcommsize2); 703628143c3dSStefano Zampini comm_n = PetscObjectComm((PetscObject)*mat_n); 703728143c3dSStefano Zampini } else { 703828143c3dSStefano Zampini comm_n = PETSC_COMM_SELF; 703928143c3dSStefano Zampini } 704028143c3dSStefano Zampini } else { /* MAT_INITIAL_MATRIX */ 7041779c1cceSStefano Zampini PetscMPIInt rank; 7042779c1cceSStefano Zampini 7043779c1cceSStefano Zampini ierr = MPI_Comm_rank(comm,&rank);CHKERRQ(ierr); 704428143c3dSStefano Zampini ierr = PetscSubcommCreate(comm,&subcomm);CHKERRQ(ierr); 704528143c3dSStefano Zampini ierr = PetscSubcommSetNumber(subcomm,2);CHKERRQ(ierr); 704628143c3dSStefano Zampini ierr = PetscSubcommSetTypeGeneral(subcomm,color,rank);CHKERRQ(ierr); 7047306c2d5bSBarry Smith comm_n = PetscSubcommChild(subcomm); 704828143c3dSStefano Zampini } 704928143c3dSStefano Zampini /* flag to destroy *mat_n if not significative */ 705028143c3dSStefano Zampini if (color) destroy_mat = PETSC_TRUE; 705128143c3dSStefano Zampini } else { 705228143c3dSStefano Zampini comm_n = comm; 705328143c3dSStefano Zampini } 705428143c3dSStefano Zampini 7055e7931f94SStefano Zampini /* prepare send/receive buffers */ 7056785e854fSJed Brown ierr = PetscMalloc1(commsize,&ilengths_idxs);CHKERRQ(ierr); 7057e7931f94SStefano Zampini ierr = PetscMemzero(ilengths_idxs,commsize*sizeof(*ilengths_idxs));CHKERRQ(ierr); 7058785e854fSJed Brown ierr = PetscMalloc1(commsize,&ilengths_vals);CHKERRQ(ierr); 7059e7931f94SStefano Zampini ierr = PetscMemzero(ilengths_vals,commsize*sizeof(*ilengths_vals));CHKERRQ(ierr); 706028143c3dSStefano Zampini if (nis) { 7061854ce69bSBarry Smith ierr = PetscCalloc1(commsize,&ilengths_idxs_is);CHKERRQ(ierr); 706228143c3dSStefano Zampini } 7063e7931f94SStefano Zampini 706428143c3dSStefano Zampini /* Get data from local matrices */ 70656c4ed002SBarry Smith if (!isdense) SETERRQ(PetscObjectComm((PetscObject)mat),PETSC_ERR_SUP,"Subassembling of AIJ local matrices not yet implemented"); 7066e7931f94SStefano 
Zampini /* TODO: See below some guidelines on how to prepare the local buffers */ 7067e7931f94SStefano Zampini /* 7068e7931f94SStefano Zampini send_buffer_vals should contain the raw values of the local matrix 7069e7931f94SStefano Zampini send_buffer_idxs should contain: 7070e7931f94SStefano Zampini - MatType_PRIVATE type 7071e7931f94SStefano Zampini - PetscInt size_of_l2gmap 7072e7931f94SStefano Zampini - PetscInt global_row_indices[size_of_l2gmap] 7073e7931f94SStefano Zampini - PetscInt all_other_info_which_is_needed_to_compute_preallocation_and_set_values 7074e7931f94SStefano Zampini */ 70756c4ed002SBarry Smith else { 7076e7931f94SStefano Zampini ierr = MatDenseGetArray(local_mat,&send_buffer_vals);CHKERRQ(ierr); 70773bbff08aSStefano Zampini ierr = ISLocalToGlobalMappingGetSize(mat->rmap->mapping,&i);CHKERRQ(ierr); 7078854ce69bSBarry Smith ierr = PetscMalloc1(i+2,&send_buffer_idxs);CHKERRQ(ierr); 7079e7931f94SStefano Zampini send_buffer_idxs[0] = (PetscInt)MATDENSE_PRIVATE; 7080e7931f94SStefano Zampini send_buffer_idxs[1] = i; 70813bbff08aSStefano Zampini ierr = ISLocalToGlobalMappingGetIndices(mat->rmap->mapping,(const PetscInt**)&ptr_idxs);CHKERRQ(ierr); 7082e7931f94SStefano Zampini ierr = PetscMemcpy(&send_buffer_idxs[2],ptr_idxs,i*sizeof(PetscInt));CHKERRQ(ierr); 70833bbff08aSStefano Zampini ierr = ISLocalToGlobalMappingRestoreIndices(mat->rmap->mapping,(const PetscInt**)&ptr_idxs);CHKERRQ(ierr); 7084e7931f94SStefano Zampini ierr = PetscMPIIntCast(i,&len);CHKERRQ(ierr); 7085e7931f94SStefano Zampini for (i=0;i<n_sends;i++) { 7086e7931f94SStefano Zampini ilengths_vals[is_indices[i]] = len*len; 7087e7931f94SStefano Zampini ilengths_idxs[is_indices[i]] = len+2; 7088c8587f34SStefano Zampini } 7089c8587f34SStefano Zampini } 7090e7931f94SStefano Zampini ierr = PetscGatherMessageLengths2(comm,n_sends,n_recvs,ilengths_idxs,ilengths_vals,&onodes,&olengths_idxs,&olengths_vals);CHKERRQ(ierr); 709128143c3dSStefano Zampini /* additional is (if any) */ 709228143c3dSStefano 
Zampini if (nis) { 709328143c3dSStefano Zampini PetscMPIInt psum; 709428143c3dSStefano Zampini PetscInt j; 709528143c3dSStefano Zampini for (j=0,psum=0;j<nis;j++) { 709628143c3dSStefano Zampini PetscInt plen; 709728143c3dSStefano Zampini ierr = ISGetLocalSize(isarray[j],&plen);CHKERRQ(ierr); 709828143c3dSStefano Zampini ierr = PetscMPIIntCast(plen,&len);CHKERRQ(ierr); 709928143c3dSStefano Zampini psum += len+1; /* indices + lenght */ 710028143c3dSStefano Zampini } 7101854ce69bSBarry Smith ierr = PetscMalloc1(psum,&send_buffer_idxs_is);CHKERRQ(ierr); 710228143c3dSStefano Zampini for (j=0,psum=0;j<nis;j++) { 710328143c3dSStefano Zampini PetscInt plen; 710428143c3dSStefano Zampini const PetscInt *is_array_idxs; 710528143c3dSStefano Zampini ierr = ISGetLocalSize(isarray[j],&plen);CHKERRQ(ierr); 710628143c3dSStefano Zampini send_buffer_idxs_is[psum] = plen; 710728143c3dSStefano Zampini ierr = ISGetIndices(isarray[j],&is_array_idxs);CHKERRQ(ierr); 710828143c3dSStefano Zampini ierr = PetscMemcpy(&send_buffer_idxs_is[psum+1],is_array_idxs,plen*sizeof(PetscInt));CHKERRQ(ierr); 710928143c3dSStefano Zampini ierr = ISRestoreIndices(isarray[j],&is_array_idxs);CHKERRQ(ierr); 711028143c3dSStefano Zampini psum += plen+1; /* indices + lenght */ 711128143c3dSStefano Zampini } 711228143c3dSStefano Zampini for (i=0;i<n_sends;i++) { 711328143c3dSStefano Zampini ilengths_idxs_is[is_indices[i]] = psum; 711428143c3dSStefano Zampini } 711528143c3dSStefano Zampini ierr = PetscGatherMessageLengths(comm,n_sends,n_recvs,ilengths_idxs_is,&onodes_is,&olengths_idxs_is);CHKERRQ(ierr); 711628143c3dSStefano Zampini } 71173b3b1effSJed Brown ierr = MatISRestoreLocalMat(mat,&local_mat);CHKERRQ(ierr); 711828143c3dSStefano Zampini 7119e7931f94SStefano Zampini buf_size_idxs = 0; 7120e7931f94SStefano Zampini buf_size_vals = 0; 712128143c3dSStefano Zampini buf_size_idxs_is = 0; 71221ae86dd6SStefano Zampini buf_size_vecs = 0; 7123e7931f94SStefano Zampini for (i=0;i<n_recvs;i++) { 7124e7931f94SStefano Zampini 
buf_size_idxs += (PetscInt)olengths_idxs[i]; 7125e7931f94SStefano Zampini buf_size_vals += (PetscInt)olengths_vals[i]; 712628143c3dSStefano Zampini if (nis) buf_size_idxs_is += (PetscInt)olengths_idxs_is[i]; 71271ae86dd6SStefano Zampini if (nvecs) buf_size_vecs += (PetscInt)olengths_idxs[i]; 7128e7931f94SStefano Zampini } 7129785e854fSJed Brown ierr = PetscMalloc1(buf_size_idxs,&recv_buffer_idxs);CHKERRQ(ierr); 7130785e854fSJed Brown ierr = PetscMalloc1(buf_size_vals,&recv_buffer_vals);CHKERRQ(ierr); 713195ecbf38SStefano Zampini ierr = PetscMalloc1(buf_size_idxs_is,&recv_buffer_idxs_is);CHKERRQ(ierr); 71321ae86dd6SStefano Zampini ierr = PetscMalloc1(buf_size_vecs,&recv_buffer_vecs);CHKERRQ(ierr); 7133e7931f94SStefano Zampini 7134e7931f94SStefano Zampini /* get new tags for clean communications */ 7135e7931f94SStefano Zampini ierr = PetscObjectGetNewTag((PetscObject)mat,&tag_idxs);CHKERRQ(ierr); 7136e7931f94SStefano Zampini ierr = PetscObjectGetNewTag((PetscObject)mat,&tag_vals);CHKERRQ(ierr); 713728143c3dSStefano Zampini ierr = PetscObjectGetNewTag((PetscObject)mat,&tag_idxs_is);CHKERRQ(ierr); 71381ae86dd6SStefano Zampini ierr = PetscObjectGetNewTag((PetscObject)mat,&tag_vecs);CHKERRQ(ierr); 7139e7931f94SStefano Zampini 7140e7931f94SStefano Zampini /* allocate for requests */ 7141785e854fSJed Brown ierr = PetscMalloc1(n_sends,&send_req_idxs);CHKERRQ(ierr); 7142785e854fSJed Brown ierr = PetscMalloc1(n_sends,&send_req_vals);CHKERRQ(ierr); 714395ecbf38SStefano Zampini ierr = PetscMalloc1(n_sends,&send_req_idxs_is);CHKERRQ(ierr); 71441ae86dd6SStefano Zampini ierr = PetscMalloc1(n_sends,&send_req_vecs);CHKERRQ(ierr); 7145785e854fSJed Brown ierr = PetscMalloc1(n_recvs,&recv_req_idxs);CHKERRQ(ierr); 7146785e854fSJed Brown ierr = PetscMalloc1(n_recvs,&recv_req_vals);CHKERRQ(ierr); 714795ecbf38SStefano Zampini ierr = PetscMalloc1(n_recvs,&recv_req_idxs_is);CHKERRQ(ierr); 71481ae86dd6SStefano Zampini ierr = PetscMalloc1(n_recvs,&recv_req_vecs);CHKERRQ(ierr); 
7149e7931f94SStefano Zampini 7150e7931f94SStefano Zampini /* communications */ 7151e7931f94SStefano Zampini ptr_idxs = recv_buffer_idxs; 7152e7931f94SStefano Zampini ptr_vals = recv_buffer_vals; 715328143c3dSStefano Zampini ptr_idxs_is = recv_buffer_idxs_is; 71541ae86dd6SStefano Zampini ptr_vecs = recv_buffer_vecs; 7155e7931f94SStefano Zampini for (i=0;i<n_recvs;i++) { 7156e7931f94SStefano Zampini source_dest = onodes[i]; 7157e7931f94SStefano Zampini ierr = MPI_Irecv(ptr_idxs,olengths_idxs[i],MPIU_INT,source_dest,tag_idxs,comm,&recv_req_idxs[i]);CHKERRQ(ierr); 7158e7931f94SStefano Zampini ierr = MPI_Irecv(ptr_vals,olengths_vals[i],MPIU_SCALAR,source_dest,tag_vals,comm,&recv_req_vals[i]);CHKERRQ(ierr); 7159e7931f94SStefano Zampini ptr_idxs += olengths_idxs[i]; 7160e7931f94SStefano Zampini ptr_vals += olengths_vals[i]; 716128143c3dSStefano Zampini if (nis) { 716257de7509SStefano Zampini source_dest = onodes_is[i]; 716328143c3dSStefano Zampini ierr = MPI_Irecv(ptr_idxs_is,olengths_idxs_is[i],MPIU_INT,source_dest,tag_idxs_is,comm,&recv_req_idxs_is[i]);CHKERRQ(ierr); 716428143c3dSStefano Zampini ptr_idxs_is += olengths_idxs_is[i]; 716528143c3dSStefano Zampini } 71661ae86dd6SStefano Zampini if (nvecs) { 71671ae86dd6SStefano Zampini source_dest = onodes[i]; 71681ae86dd6SStefano Zampini ierr = MPI_Irecv(ptr_vecs,olengths_idxs[i]-2,MPIU_SCALAR,source_dest,tag_vecs,comm,&recv_req_vecs[i]);CHKERRQ(ierr); 71691ae86dd6SStefano Zampini ptr_vecs += olengths_idxs[i]-2; 71701ae86dd6SStefano Zampini } 7171e7931f94SStefano Zampini } 7172e7931f94SStefano Zampini for (i=0;i<n_sends;i++) { 7173e7931f94SStefano Zampini ierr = PetscMPIIntCast(is_indices[i],&source_dest);CHKERRQ(ierr); 7174e7931f94SStefano Zampini ierr = MPI_Isend(send_buffer_idxs,ilengths_idxs[source_dest],MPIU_INT,source_dest,tag_idxs,comm,&send_req_idxs[i]);CHKERRQ(ierr); 7175e7931f94SStefano Zampini ierr = 
MPI_Isend(send_buffer_vals,ilengths_vals[source_dest],MPIU_SCALAR,source_dest,tag_vals,comm,&send_req_vals[i]);CHKERRQ(ierr); 717628143c3dSStefano Zampini if (nis) { 717728143c3dSStefano Zampini ierr = MPI_Isend(send_buffer_idxs_is,ilengths_idxs_is[source_dest],MPIU_INT,source_dest,tag_idxs_is,comm,&send_req_idxs_is[i]);CHKERRQ(ierr); 717828143c3dSStefano Zampini } 71791ae86dd6SStefano Zampini if (nvecs) { 71801ae86dd6SStefano Zampini ierr = VecGetArray(nnsp_vec[0],&send_buffer_vecs);CHKERRQ(ierr); 71811ae86dd6SStefano Zampini ierr = MPI_Isend(send_buffer_vecs,ilengths_idxs[source_dest]-2,MPIU_SCALAR,source_dest,tag_vecs,comm,&send_req_vecs[i]);CHKERRQ(ierr); 71821ae86dd6SStefano Zampini } 7183e7931f94SStefano Zampini } 7184e7931f94SStefano Zampini ierr = ISRestoreIndices(is_sends_internal,&is_indices);CHKERRQ(ierr); 7185e7931f94SStefano Zampini ierr = ISDestroy(&is_sends_internal);CHKERRQ(ierr); 7186e7931f94SStefano Zampini 7187e7931f94SStefano Zampini /* assemble new l2g map */ 7188e7931f94SStefano Zampini ierr = MPI_Waitall(n_recvs,recv_req_idxs,MPI_STATUSES_IGNORE);CHKERRQ(ierr); 7189e7931f94SStefano Zampini ptr_idxs = recv_buffer_idxs; 71909d30be91SStefano Zampini new_local_rows = 0; 7191e7931f94SStefano Zampini for (i=0;i<n_recvs;i++) { 71929d30be91SStefano Zampini new_local_rows += *(ptr_idxs+1); /* second element is the local size of the l2gmap */ 7193e7931f94SStefano Zampini ptr_idxs += olengths_idxs[i]; 7194e7931f94SStefano Zampini } 71959d30be91SStefano Zampini ierr = PetscMalloc1(new_local_rows,&l2gmap_indices);CHKERRQ(ierr); 7196e7931f94SStefano Zampini ptr_idxs = recv_buffer_idxs; 71979d30be91SStefano Zampini new_local_rows = 0; 7198e7931f94SStefano Zampini for (i=0;i<n_recvs;i++) { 71999d30be91SStefano Zampini ierr = PetscMemcpy(&l2gmap_indices[new_local_rows],ptr_idxs+2,(*(ptr_idxs+1))*sizeof(PetscInt));CHKERRQ(ierr); 72009d30be91SStefano Zampini new_local_rows += *(ptr_idxs+1); /* second element is the local size of the l2gmap */ 
7201e7931f94SStefano Zampini ptr_idxs += olengths_idxs[i]; 7202e7931f94SStefano Zampini } 72039d30be91SStefano Zampini ierr = PetscSortRemoveDupsInt(&new_local_rows,l2gmap_indices);CHKERRQ(ierr); 72049d30be91SStefano Zampini ierr = ISLocalToGlobalMappingCreate(comm_n,1,new_local_rows,l2gmap_indices,PETSC_COPY_VALUES,&l2gmap);CHKERRQ(ierr); 7205e7931f94SStefano Zampini ierr = PetscFree(l2gmap_indices);CHKERRQ(ierr); 7206e7931f94SStefano Zampini 7207e7931f94SStefano Zampini /* infer new local matrix type from received local matrices type */ 7208e7931f94SStefano Zampini /* currently if all local matrices are of type X, then the resulting matrix will be of type X, except for the dense case */ 7209e7931f94SStefano Zampini /* it also assumes that if the block size is set, than it is the same among all local matrices (see checks at the beginning of the function) */ 7210e7931f94SStefano Zampini if (n_recvs) { 721128143c3dSStefano Zampini MatTypePrivate new_local_type_private = (MatTypePrivate)send_buffer_idxs[0]; 7212e7931f94SStefano Zampini ptr_idxs = recv_buffer_idxs; 7213e7931f94SStefano Zampini for (i=0;i<n_recvs;i++) { 7214e7931f94SStefano Zampini if ((PetscInt)new_local_type_private != *ptr_idxs) { 7215e7931f94SStefano Zampini new_local_type_private = MATAIJ_PRIVATE; 7216e7931f94SStefano Zampini break; 7217e7931f94SStefano Zampini } 7218e7931f94SStefano Zampini ptr_idxs += olengths_idxs[i]; 7219e7931f94SStefano Zampini } 7220e7931f94SStefano Zampini switch (new_local_type_private) { 722128143c3dSStefano Zampini case MATDENSE_PRIVATE: 7222e7931f94SStefano Zampini new_local_type = MATSEQAIJ; 7223e7931f94SStefano Zampini bs = 1; 7224e7931f94SStefano Zampini break; 7225e7931f94SStefano Zampini case MATAIJ_PRIVATE: 7226e7931f94SStefano Zampini new_local_type = MATSEQAIJ; 7227e7931f94SStefano Zampini bs = 1; 7228e7931f94SStefano Zampini break; 7229e7931f94SStefano Zampini case MATBAIJ_PRIVATE: 7230e7931f94SStefano Zampini new_local_type = MATSEQBAIJ; 7231e7931f94SStefano 
Zampini break; 7232e7931f94SStefano Zampini case MATSBAIJ_PRIVATE: 7233e7931f94SStefano Zampini new_local_type = MATSEQSBAIJ; 7234e7931f94SStefano Zampini break; 7235e7931f94SStefano Zampini default: 7236fbfcfee5SBarry Smith SETERRQ2(comm,PETSC_ERR_SUP,"Unsupported private type %d in %s",new_local_type_private,PETSC_FUNCTION_NAME); 7237e7931f94SStefano Zampini break; 7238e7931f94SStefano Zampini } 7239ed8ed4edSstefano_zampini } else { /* by default, new_local_type is seqaij */ 7240ed8ed4edSstefano_zampini new_local_type = MATSEQAIJ; 724128143c3dSStefano Zampini bs = 1; 7242e7931f94SStefano Zampini } 7243e7931f94SStefano Zampini 724470cf5478SStefano Zampini /* create MATIS object if needed */ 724557de7509SStefano Zampini if (!reuse) { 7246e7931f94SStefano Zampini ierr = MatGetSize(mat,&rows,&cols);CHKERRQ(ierr); 7247e176bc59SStefano Zampini ierr = MatCreateIS(comm_n,bs,PETSC_DECIDE,PETSC_DECIDE,rows,cols,l2gmap,NULL,mat_n);CHKERRQ(ierr); 724870cf5478SStefano Zampini } else { 724970cf5478SStefano Zampini /* it also destroys the local matrices */ 725057de7509SStefano Zampini if (*mat_n) { 725170cf5478SStefano Zampini ierr = MatSetLocalToGlobalMapping(*mat_n,l2gmap,l2gmap);CHKERRQ(ierr); 725257de7509SStefano Zampini } else { /* this is a fake object */ 725357de7509SStefano Zampini ierr = MatCreateIS(comm_n,bs,PETSC_DECIDE,PETSC_DECIDE,rows,cols,l2gmap,NULL,mat_n);CHKERRQ(ierr); 725457de7509SStefano Zampini } 725570cf5478SStefano Zampini } 725670cf5478SStefano Zampini ierr = MatISGetLocalMat(*mat_n,&local_mat);CHKERRQ(ierr); 7257e7931f94SStefano Zampini ierr = MatSetType(local_mat,new_local_type);CHKERRQ(ierr); 72589d30be91SStefano Zampini 72599d30be91SStefano Zampini ierr = MPI_Waitall(n_recvs,recv_req_vals,MPI_STATUSES_IGNORE);CHKERRQ(ierr); 72609d30be91SStefano Zampini 72619d30be91SStefano Zampini /* Global to local map of received indices */ 72629d30be91SStefano Zampini ierr = PetscMalloc1(buf_size_idxs,&recv_buffer_idxs_local);CHKERRQ(ierr); /* needed for values 
insertion */ 72639d30be91SStefano Zampini ierr = ISGlobalToLocalMappingApply(l2gmap,IS_GTOLM_MASK,buf_size_idxs,recv_buffer_idxs,&i,recv_buffer_idxs_local);CHKERRQ(ierr); 72649d30be91SStefano Zampini ierr = ISLocalToGlobalMappingDestroy(&l2gmap);CHKERRQ(ierr); 72659d30be91SStefano Zampini 72669d30be91SStefano Zampini /* restore attributes -> type of incoming data and its size */ 72679d30be91SStefano Zampini buf_size_idxs = 0; 72689d30be91SStefano Zampini for (i=0;i<n_recvs;i++) { 72699d30be91SStefano Zampini recv_buffer_idxs_local[buf_size_idxs] = recv_buffer_idxs[buf_size_idxs]; 72709d30be91SStefano Zampini recv_buffer_idxs_local[buf_size_idxs+1] = recv_buffer_idxs[buf_size_idxs+1]; 72719d30be91SStefano Zampini buf_size_idxs += (PetscInt)olengths_idxs[i]; 72729d30be91SStefano Zampini } 72739d30be91SStefano Zampini ierr = PetscFree(recv_buffer_idxs);CHKERRQ(ierr); 72749d30be91SStefano Zampini 72759d30be91SStefano Zampini /* set preallocation */ 72769d30be91SStefano Zampini ierr = PetscObjectTypeCompare((PetscObject)local_mat,MATSEQDENSE,&newisdense);CHKERRQ(ierr); 72779d30be91SStefano Zampini if (!newisdense) { 72789d30be91SStefano Zampini PetscInt *new_local_nnz=0; 72799d30be91SStefano Zampini 72809d30be91SStefano Zampini ptr_idxs = recv_buffer_idxs_local; 72819d30be91SStefano Zampini if (n_recvs) { 72829d30be91SStefano Zampini ierr = PetscCalloc1(new_local_rows,&new_local_nnz);CHKERRQ(ierr); 72839d30be91SStefano Zampini } 72849d30be91SStefano Zampini for (i=0;i<n_recvs;i++) { 72859d30be91SStefano Zampini PetscInt j; 72869d30be91SStefano Zampini if (*ptr_idxs == (PetscInt)MATDENSE_PRIVATE) { /* preallocation provided for dense case only */ 72879d30be91SStefano Zampini for (j=0;j<*(ptr_idxs+1);j++) { 72889d30be91SStefano Zampini new_local_nnz[*(ptr_idxs+2+j)] += *(ptr_idxs+1); 72899d30be91SStefano Zampini } 72909d30be91SStefano Zampini } else { 72919d30be91SStefano Zampini /* TODO */ 72929d30be91SStefano Zampini } 72939d30be91SStefano Zampini ptr_idxs += 
olengths_idxs[i]; 72949d30be91SStefano Zampini } 72959d30be91SStefano Zampini if (new_local_nnz) { 72969d30be91SStefano Zampini for (i=0;i<new_local_rows;i++) new_local_nnz[i] = PetscMin(new_local_nnz[i],new_local_rows); 72979d30be91SStefano Zampini ierr = MatSeqAIJSetPreallocation(local_mat,0,new_local_nnz);CHKERRQ(ierr); 72989d30be91SStefano Zampini for (i=0;i<new_local_rows;i++) new_local_nnz[i] /= bs; 72999d30be91SStefano Zampini ierr = MatSeqBAIJSetPreallocation(local_mat,bs,0,new_local_nnz);CHKERRQ(ierr); 73009d30be91SStefano Zampini for (i=0;i<new_local_rows;i++) new_local_nnz[i] = PetscMax(new_local_nnz[i]-i,0); 73019d30be91SStefano Zampini ierr = MatSeqSBAIJSetPreallocation(local_mat,bs,0,new_local_nnz);CHKERRQ(ierr); 73029d30be91SStefano Zampini } else { 73039d30be91SStefano Zampini ierr = MatSetUp(local_mat);CHKERRQ(ierr); 73049d30be91SStefano Zampini } 73059d30be91SStefano Zampini ierr = PetscFree(new_local_nnz);CHKERRQ(ierr); 73069d30be91SStefano Zampini } else { 73079d30be91SStefano Zampini ierr = MatSetUp(local_mat);CHKERRQ(ierr); 73089d30be91SStefano Zampini } 7309e7931f94SStefano Zampini 7310e7931f94SStefano Zampini /* set values */ 7311e7931f94SStefano Zampini ptr_vals = recv_buffer_vals; 73129d30be91SStefano Zampini ptr_idxs = recv_buffer_idxs_local; 7313e7931f94SStefano Zampini for (i=0;i<n_recvs;i++) { 7314e7931f94SStefano Zampini if (*ptr_idxs == (PetscInt)MATDENSE_PRIVATE) { /* values insertion provided for dense case only */ 7315e7931f94SStefano Zampini ierr = MatSetOption(local_mat,MAT_ROW_ORIENTED,PETSC_FALSE);CHKERRQ(ierr); 73169d30be91SStefano Zampini ierr = MatSetValues(local_mat,*(ptr_idxs+1),ptr_idxs+2,*(ptr_idxs+1),ptr_idxs+2,ptr_vals,ADD_VALUES);CHKERRQ(ierr); 7317e7931f94SStefano Zampini ierr = MatAssemblyBegin(local_mat,MAT_FLUSH_ASSEMBLY);CHKERRQ(ierr); 7318e7931f94SStefano Zampini ierr = MatAssemblyEnd(local_mat,MAT_FLUSH_ASSEMBLY);CHKERRQ(ierr); 7319e7931f94SStefano Zampini ierr = 
MatSetOption(local_mat,MAT_ROW_ORIENTED,PETSC_TRUE);CHKERRQ(ierr); 732028143c3dSStefano Zampini } else { 732128143c3dSStefano Zampini /* TODO */ 7322e7931f94SStefano Zampini } 7323e7931f94SStefano Zampini ptr_idxs += olengths_idxs[i]; 7324e7931f94SStefano Zampini ptr_vals += olengths_vals[i]; 7325e7931f94SStefano Zampini } 7326e7931f94SStefano Zampini ierr = MatAssemblyBegin(local_mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 7327e7931f94SStefano Zampini ierr = MatAssemblyEnd(local_mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 73283b3b1effSJed Brown ierr = MatISRestoreLocalMat(*mat_n,&local_mat);CHKERRQ(ierr); 732970cf5478SStefano Zampini ierr = MatAssemblyBegin(*mat_n,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 733070cf5478SStefano Zampini ierr = MatAssemblyEnd(*mat_n,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 73319d30be91SStefano Zampini ierr = PetscFree(recv_buffer_vals);CHKERRQ(ierr); 7332e7931f94SStefano Zampini 7333dfd14d43SStefano Zampini #if 0 733428143c3dSStefano Zampini if (!restrict_comm) { /* check */ 7335e7931f94SStefano Zampini Vec lvec,rvec; 7336e7931f94SStefano Zampini PetscReal infty_error; 7337e7931f94SStefano Zampini 73382a7a6963SBarry Smith ierr = MatCreateVecs(mat,&rvec,&lvec);CHKERRQ(ierr); 7339e7931f94SStefano Zampini ierr = VecSetRandom(rvec,NULL);CHKERRQ(ierr); 7340e7931f94SStefano Zampini ierr = MatMult(mat,rvec,lvec);CHKERRQ(ierr); 7341e7931f94SStefano Zampini ierr = VecScale(lvec,-1.0);CHKERRQ(ierr); 734270cf5478SStefano Zampini ierr = MatMultAdd(*mat_n,rvec,lvec,lvec);CHKERRQ(ierr); 7343e7931f94SStefano Zampini ierr = VecNorm(lvec,NORM_INFINITY,&infty_error);CHKERRQ(ierr); 7344e7931f94SStefano Zampini ierr = PetscPrintf(PetscObjectComm((PetscObject)mat),"Infinity error subassembling %1.6e\n",infty_error); 7345e7931f94SStefano Zampini ierr = VecDestroy(&rvec);CHKERRQ(ierr); 7346e7931f94SStefano Zampini ierr = VecDestroy(&lvec);CHKERRQ(ierr); 7347e7931f94SStefano Zampini } 734828143c3dSStefano Zampini #endif 7349e7931f94SStefano Zampini 735028143c3dSStefano Zampini /* 
assemble new additional is (if any) */ 735128143c3dSStefano Zampini if (nis) { 735228143c3dSStefano Zampini PetscInt **temp_idxs,*count_is,j,psum; 735328143c3dSStefano Zampini 735428143c3dSStefano Zampini ierr = MPI_Waitall(n_recvs,recv_req_idxs_is,MPI_STATUSES_IGNORE);CHKERRQ(ierr); 7355854ce69bSBarry Smith ierr = PetscCalloc1(nis,&count_is);CHKERRQ(ierr); 735628143c3dSStefano Zampini ptr_idxs = recv_buffer_idxs_is; 735728143c3dSStefano Zampini psum = 0; 735828143c3dSStefano Zampini for (i=0;i<n_recvs;i++) { 735928143c3dSStefano Zampini for (j=0;j<nis;j++) { 736028143c3dSStefano Zampini PetscInt plen = *(ptr_idxs); /* first element is the local size of IS's indices */ 736128143c3dSStefano Zampini count_is[j] += plen; /* increment counting of buffer for j-th IS */ 736228143c3dSStefano Zampini psum += plen; 736328143c3dSStefano Zampini ptr_idxs += plen+1; /* shift pointer to received data */ 736428143c3dSStefano Zampini } 736528143c3dSStefano Zampini } 7366854ce69bSBarry Smith ierr = PetscMalloc1(nis,&temp_idxs);CHKERRQ(ierr); 7367854ce69bSBarry Smith ierr = PetscMalloc1(psum,&temp_idxs[0]);CHKERRQ(ierr); 736828143c3dSStefano Zampini for (i=1;i<nis;i++) { 736928143c3dSStefano Zampini temp_idxs[i] = temp_idxs[i-1]+count_is[i-1]; 737028143c3dSStefano Zampini } 737128143c3dSStefano Zampini ierr = PetscMemzero(count_is,nis*sizeof(PetscInt));CHKERRQ(ierr); 737228143c3dSStefano Zampini ptr_idxs = recv_buffer_idxs_is; 737328143c3dSStefano Zampini for (i=0;i<n_recvs;i++) { 737428143c3dSStefano Zampini for (j=0;j<nis;j++) { 737528143c3dSStefano Zampini PetscInt plen = *(ptr_idxs); /* first element is the local size of IS's indices */ 737628143c3dSStefano Zampini ierr = PetscMemcpy(&temp_idxs[j][count_is[j]],ptr_idxs+1,plen*sizeof(PetscInt));CHKERRQ(ierr); 737728143c3dSStefano Zampini count_is[j] += plen; /* increment starting point of buffer for j-th IS */ 737828143c3dSStefano Zampini ptr_idxs += plen+1; /* shift pointer to received data */ 737928143c3dSStefano Zampini } 
738028143c3dSStefano Zampini } 738128143c3dSStefano Zampini for (i=0;i<nis;i++) { 738228143c3dSStefano Zampini ierr = ISDestroy(&isarray[i]);CHKERRQ(ierr); 738328143c3dSStefano Zampini ierr = PetscSortRemoveDupsInt(&count_is[i],temp_idxs[i]);CHKERRQ(ierr);CHKERRQ(ierr); 738428143c3dSStefano Zampini ierr = ISCreateGeneral(comm_n,count_is[i],temp_idxs[i],PETSC_COPY_VALUES,&isarray[i]);CHKERRQ(ierr); 738528143c3dSStefano Zampini } 738628143c3dSStefano Zampini ierr = PetscFree(count_is);CHKERRQ(ierr); 738728143c3dSStefano Zampini ierr = PetscFree(temp_idxs[0]);CHKERRQ(ierr); 738828143c3dSStefano Zampini ierr = PetscFree(temp_idxs);CHKERRQ(ierr); 738928143c3dSStefano Zampini } 7390e7931f94SStefano Zampini /* free workspace */ 739128143c3dSStefano Zampini ierr = PetscFree(recv_buffer_idxs_is);CHKERRQ(ierr); 7392e7931f94SStefano Zampini ierr = MPI_Waitall(n_sends,send_req_idxs,MPI_STATUSES_IGNORE);CHKERRQ(ierr); 7393e7931f94SStefano Zampini ierr = PetscFree(send_buffer_idxs);CHKERRQ(ierr); 7394e7931f94SStefano Zampini ierr = MPI_Waitall(n_sends,send_req_vals,MPI_STATUSES_IGNORE);CHKERRQ(ierr); 7395e7931f94SStefano Zampini if (isdense) { 7396e7931f94SStefano Zampini ierr = MatISGetLocalMat(mat,&local_mat);CHKERRQ(ierr); 7397e7931f94SStefano Zampini ierr = MatDenseRestoreArray(local_mat,&send_buffer_vals);CHKERRQ(ierr); 73983b3b1effSJed Brown ierr = MatISRestoreLocalMat(mat,&local_mat);CHKERRQ(ierr); 7399e7931f94SStefano Zampini } else { 7400e7931f94SStefano Zampini /* ierr = PetscFree(send_buffer_vals);CHKERRQ(ierr); */ 7401e7931f94SStefano Zampini } 740228143c3dSStefano Zampini if (nis) { 740328143c3dSStefano Zampini ierr = MPI_Waitall(n_sends,send_req_idxs_is,MPI_STATUSES_IGNORE);CHKERRQ(ierr); 740428143c3dSStefano Zampini ierr = PetscFree(send_buffer_idxs_is);CHKERRQ(ierr); 740528143c3dSStefano Zampini } 74061ae86dd6SStefano Zampini 74071ae86dd6SStefano Zampini if (nvecs) { 74081ae86dd6SStefano Zampini ierr = 
MPI_Waitall(n_recvs,recv_req_vecs,MPI_STATUSES_IGNORE);CHKERRQ(ierr); 74091ae86dd6SStefano Zampini ierr = MPI_Waitall(n_sends,send_req_vecs,MPI_STATUSES_IGNORE);CHKERRQ(ierr); 74101ae86dd6SStefano Zampini ierr = VecRestoreArray(nnsp_vec[0],&send_buffer_vecs);CHKERRQ(ierr); 74111ae86dd6SStefano Zampini ierr = VecDestroy(&nnsp_vec[0]);CHKERRQ(ierr); 74121ae86dd6SStefano Zampini ierr = VecCreate(comm_n,&nnsp_vec[0]);CHKERRQ(ierr); 74131ae86dd6SStefano Zampini ierr = VecSetSizes(nnsp_vec[0],new_local_rows,PETSC_DECIDE);CHKERRQ(ierr); 74141ae86dd6SStefano Zampini ierr = VecSetType(nnsp_vec[0],VECSTANDARD);CHKERRQ(ierr); 74151ae86dd6SStefano Zampini /* set values */ 74161ae86dd6SStefano Zampini ptr_vals = recv_buffer_vecs; 74171ae86dd6SStefano Zampini ptr_idxs = recv_buffer_idxs_local; 74181ae86dd6SStefano Zampini ierr = VecGetArray(nnsp_vec[0],&send_buffer_vecs);CHKERRQ(ierr); 74191ae86dd6SStefano Zampini for (i=0;i<n_recvs;i++) { 74201ae86dd6SStefano Zampini PetscInt j; 74211ae86dd6SStefano Zampini for (j=0;j<*(ptr_idxs+1);j++) { 74221ae86dd6SStefano Zampini send_buffer_vecs[*(ptr_idxs+2+j)] += *(ptr_vals + j); 74231ae86dd6SStefano Zampini } 74241ae86dd6SStefano Zampini ptr_idxs += olengths_idxs[i]; 74251ae86dd6SStefano Zampini ptr_vals += olengths_idxs[i]-2; 74261ae86dd6SStefano Zampini } 74271ae86dd6SStefano Zampini ierr = VecRestoreArray(nnsp_vec[0],&send_buffer_vecs);CHKERRQ(ierr); 74281ae86dd6SStefano Zampini ierr = VecAssemblyBegin(nnsp_vec[0]);CHKERRQ(ierr); 74291ae86dd6SStefano Zampini ierr = VecAssemblyEnd(nnsp_vec[0]);CHKERRQ(ierr); 74301ae86dd6SStefano Zampini } 74311ae86dd6SStefano Zampini 74321ae86dd6SStefano Zampini ierr = PetscFree(recv_buffer_vecs);CHKERRQ(ierr); 74331ae86dd6SStefano Zampini ierr = PetscFree(recv_buffer_idxs_local);CHKERRQ(ierr); 7434e7931f94SStefano Zampini ierr = PetscFree(recv_req_idxs);CHKERRQ(ierr); 7435e7931f94SStefano Zampini ierr = PetscFree(recv_req_vals);CHKERRQ(ierr); 74361ae86dd6SStefano Zampini ierr = 
PetscFree(recv_req_vecs);CHKERRQ(ierr); 743728143c3dSStefano Zampini ierr = PetscFree(recv_req_idxs_is);CHKERRQ(ierr); 7438e7931f94SStefano Zampini ierr = PetscFree(send_req_idxs);CHKERRQ(ierr); 7439e7931f94SStefano Zampini ierr = PetscFree(send_req_vals);CHKERRQ(ierr); 74401ae86dd6SStefano Zampini ierr = PetscFree(send_req_vecs);CHKERRQ(ierr); 744128143c3dSStefano Zampini ierr = PetscFree(send_req_idxs_is);CHKERRQ(ierr); 7442e7931f94SStefano Zampini ierr = PetscFree(ilengths_vals);CHKERRQ(ierr); 7443e7931f94SStefano Zampini ierr = PetscFree(ilengths_idxs);CHKERRQ(ierr); 7444e7931f94SStefano Zampini ierr = PetscFree(olengths_vals);CHKERRQ(ierr); 7445e7931f94SStefano Zampini ierr = PetscFree(olengths_idxs);CHKERRQ(ierr); 7446e7931f94SStefano Zampini ierr = PetscFree(onodes);CHKERRQ(ierr); 744728143c3dSStefano Zampini if (nis) { 744828143c3dSStefano Zampini ierr = PetscFree(ilengths_idxs_is);CHKERRQ(ierr); 744928143c3dSStefano Zampini ierr = PetscFree(olengths_idxs_is);CHKERRQ(ierr); 745028143c3dSStefano Zampini ierr = PetscFree(onodes_is);CHKERRQ(ierr); 745128143c3dSStefano Zampini } 745228143c3dSStefano Zampini ierr = PetscSubcommDestroy(&subcomm);CHKERRQ(ierr); 745328143c3dSStefano Zampini if (destroy_mat) { /* destroy mat is true only if restrict comm is true and process will not partecipate */ 745428143c3dSStefano Zampini ierr = MatDestroy(mat_n);CHKERRQ(ierr); 745528143c3dSStefano Zampini for (i=0;i<nis;i++) { 745628143c3dSStefano Zampini ierr = ISDestroy(&isarray[i]);CHKERRQ(ierr); 745728143c3dSStefano Zampini } 74581ae86dd6SStefano Zampini if (nvecs) { /* need to match VecDestroy nnsp_vec called in the other code path */ 74591ae86dd6SStefano Zampini ierr = VecDestroy(&nnsp_vec[0]);CHKERRQ(ierr); 74601ae86dd6SStefano Zampini } 746153a05cb3SStefano Zampini *mat_n = NULL; 746228143c3dSStefano Zampini } 7463e7931f94SStefano Zampini PetscFunctionReturn(0); 7464e7931f94SStefano Zampini } 7465a57a6d2fSStefano Zampini 746612edc857SStefano Zampini /* temporary hack 
into ksp private data structure */ 7467af0996ceSBarry Smith #include <petsc/private/kspimpl.h> 746812edc857SStefano Zampini 7469c8587f34SStefano Zampini PetscErrorCode PCBDDCSetUpCoarseSolver(PC pc,PetscScalar* coarse_submat_vals) 7470c8587f34SStefano Zampini { 7471c8587f34SStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 7472c8587f34SStefano Zampini PC_IS *pcis = (PC_IS*)pc->data; 747320a2ab83SStefano Zampini Mat coarse_mat,coarse_mat_is,coarse_submat_dense; 74741ae86dd6SStefano Zampini Mat coarsedivudotp = NULL; 74751e0482f5SStefano Zampini Mat coarseG,t_coarse_mat_is; 74769881197aSStefano Zampini MatNullSpace CoarseNullSpace = NULL; 747720a2ab83SStefano Zampini ISLocalToGlobalMapping coarse_islg; 74786e683305SStefano Zampini IS coarse_is,*isarray; 74796e683305SStefano Zampini PetscInt i,im_active=-1,active_procs=-1; 748030368db7SStefano Zampini PetscInt nis,nisdofs,nisneu,nisvert; 7481f9eb5b7dSStefano Zampini PC pc_temp; 7482c8587f34SStefano Zampini PCType coarse_pc_type; 7483c8587f34SStefano Zampini KSPType coarse_ksp_type; 7484f9eb5b7dSStefano Zampini PetscBool multilevel_requested,multilevel_allowed; 74857274672aSStefano Zampini PetscBool coarse_reuse; 74861e0482f5SStefano Zampini PetscInt ncoarse,nedcfield; 748768457ee5SStefano Zampini PetscBool compute_vecs = PETSC_FALSE; 748822bc73bbSStefano Zampini PetscScalar *array; 748957de7509SStefano Zampini MatReuse coarse_mat_reuse; 749057de7509SStefano Zampini PetscBool restr, full_restr, have_void; 74917de4f681Sstefano_zampini PetscMPIInt commsize; 74929881197aSStefano Zampini PetscErrorCode ierr; 7493fdc09c96SStefano Zampini 7494c8587f34SStefano Zampini PetscFunctionBegin; 7495c8587f34SStefano Zampini /* Assign global numbering to coarse dofs */ 749668457ee5SStefano Zampini if (pcbddc->new_primal_space || pcbddc->coarse_size == -1) { /* a new primal space is present or it is the first initialization, so recompute global numbering */ 7497fa7f1dd8SStefano Zampini PetscInt ocoarse_size; 74985a75c04eSSatish 
Balay compute_vecs = PETSC_TRUE; 74997de4f681Sstefano_zampini 75007de4f681Sstefano_zampini pcbddc->new_primal_space = PETSC_TRUE; 7501fa7f1dd8SStefano Zampini ocoarse_size = pcbddc->coarse_size; 7502f4ddd8eeSStefano Zampini ierr = PetscFree(pcbddc->global_primal_indices);CHKERRQ(ierr); 7503f4ddd8eeSStefano Zampini ierr = PCBDDCComputePrimalNumbering(pc,&pcbddc->coarse_size,&pcbddc->global_primal_indices);CHKERRQ(ierr); 7504f4ddd8eeSStefano Zampini /* see if we can avoid some work */ 7505fa7f1dd8SStefano Zampini if (pcbddc->coarse_ksp) { /* coarse ksp has already been created */ 750651bea450SStefano Zampini /* if the coarse size is different or we are using adaptive selection, better to not reuse the coarse matrix */ 750751bea450SStefano Zampini if (ocoarse_size != pcbddc->coarse_size || pcbddc->adaptive_selection) { 7508727cdba6SStefano Zampini ierr = KSPReset(pcbddc->coarse_ksp);CHKERRQ(ierr); 7509fa7f1dd8SStefano Zampini coarse_reuse = PETSC_FALSE; 7510fa7f1dd8SStefano Zampini } else { /* we can safely reuse already computed coarse matrix */ 7511fa7f1dd8SStefano Zampini coarse_reuse = PETSC_TRUE; 7512f4ddd8eeSStefano Zampini } 7513fa7f1dd8SStefano Zampini } else { /* there's no coarse ksp, so we need to create the coarse matrix too */ 7514fa7f1dd8SStefano Zampini coarse_reuse = PETSC_FALSE; 7515f4ddd8eeSStefano Zampini } 751670cf5478SStefano Zampini /* reset any subassembling information */ 751757de7509SStefano Zampini if (!coarse_reuse || pcbddc->recompute_topography) { 751870cf5478SStefano Zampini ierr = ISDestroy(&pcbddc->coarse_subassembling);CHKERRQ(ierr); 751957de7509SStefano Zampini } 75206e683305SStefano Zampini } else { /* primal space is unchanged, so we can reuse coarse matrix */ 7521fa7f1dd8SStefano Zampini coarse_reuse = PETSC_TRUE; 7522f4ddd8eeSStefano Zampini } 752357de7509SStefano Zampini /* assemble coarse matrix */ 752457de7509SStefano Zampini if (coarse_reuse && pcbddc->coarse_ksp) { 752557de7509SStefano Zampini ierr = 
KSPGetOperators(pcbddc->coarse_ksp,&coarse_mat,NULL);CHKERRQ(ierr); 752657de7509SStefano Zampini ierr = PetscObjectReference((PetscObject)coarse_mat);CHKERRQ(ierr); 752757de7509SStefano Zampini coarse_mat_reuse = MAT_REUSE_MATRIX; 752818a45a71SStefano Zampini } else { 752957de7509SStefano Zampini coarse_mat = NULL; 753057de7509SStefano Zampini coarse_mat_reuse = MAT_INITIAL_MATRIX; 75316e683305SStefano Zampini } 7532e7931f94SStefano Zampini 7533abbbba34SStefano Zampini /* creates temporary l2gmap and IS for coarse indexes */ 7534abbbba34SStefano Zampini ierr = ISCreateGeneral(PetscObjectComm((PetscObject)pc),pcbddc->local_primal_size,pcbddc->global_primal_indices,PETSC_COPY_VALUES,&coarse_is);CHKERRQ(ierr); 7535abbbba34SStefano Zampini ierr = ISLocalToGlobalMappingCreateIS(coarse_is,&coarse_islg);CHKERRQ(ierr); 7536abbbba34SStefano Zampini 7537abbbba34SStefano Zampini /* creates temporary MATIS object for coarse matrix */ 753822bc73bbSStefano Zampini ierr = MatCreateSeqDense(PETSC_COMM_SELF,pcbddc->local_primal_size,pcbddc->local_primal_size,NULL,&coarse_submat_dense);CHKERRQ(ierr); 753922bc73bbSStefano Zampini ierr = MatDenseGetArray(coarse_submat_dense,&array);CHKERRQ(ierr); 754022bc73bbSStefano Zampini ierr = PetscMemcpy(array,coarse_submat_vals,sizeof(*coarse_submat_vals)*pcbddc->local_primal_size*pcbddc->local_primal_size);CHKERRQ(ierr); 754122bc73bbSStefano Zampini ierr = MatDenseRestoreArray(coarse_submat_dense,&array);CHKERRQ(ierr); 7542e176bc59SStefano Zampini ierr = MatCreateIS(PetscObjectComm((PetscObject)pc),1,PETSC_DECIDE,PETSC_DECIDE,pcbddc->coarse_size,pcbddc->coarse_size,coarse_islg,NULL,&t_coarse_mat_is);CHKERRQ(ierr); 75436e683305SStefano Zampini ierr = MatISSetLocalMat(t_coarse_mat_is,coarse_submat_dense);CHKERRQ(ierr); 75446e683305SStefano Zampini ierr = MatAssemblyBegin(t_coarse_mat_is,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 75456e683305SStefano Zampini ierr = MatAssemblyEnd(t_coarse_mat_is,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 7546abbbba34SStefano 
Zampini ierr = MatDestroy(&coarse_submat_dense);CHKERRQ(ierr); 7547abbbba34SStefano Zampini 754857de7509SStefano Zampini /* count "active" (i.e. with positive local size) and "void" processes */ 754957de7509SStefano Zampini im_active = !!(pcis->n); 755057de7509SStefano Zampini ierr = MPIU_Allreduce(&im_active,&active_procs,1,MPIU_INT,MPI_SUM,PetscObjectComm((PetscObject)pc));CHKERRQ(ierr); 755157de7509SStefano Zampini 755214f0bfb9SStefano Zampini /* determine number of processes partecipating to coarse solver and compute subassembling pattern */ 755357de7509SStefano Zampini /* restr : whether if we want to exclude senders (which are not receivers) from the subassembling pattern */ 755457de7509SStefano Zampini /* full_restr : just use the receivers from the subassembling pattern */ 75557de4f681Sstefano_zampini ierr = MPI_Comm_size(PetscObjectComm((PetscObject)pc),&commsize);CHKERRQ(ierr); 755657de7509SStefano Zampini coarse_mat_is = NULL; 755757de7509SStefano Zampini multilevel_allowed = PETSC_FALSE; 755857de7509SStefano Zampini multilevel_requested = PETSC_FALSE; 75591ae86dd6SStefano Zampini pcbddc->coarse_eqs_per_proc = PetscMin(PetscMax(pcbddc->coarse_size,1),pcbddc->coarse_eqs_per_proc); 756057de7509SStefano Zampini if (pcbddc->current_level < pcbddc->max_levels) multilevel_requested = PETSC_TRUE; 756157de7509SStefano Zampini if (multilevel_requested) { 756257de7509SStefano Zampini ncoarse = active_procs/pcbddc->coarsening_ratio; 756357de7509SStefano Zampini restr = PETSC_FALSE; 756457de7509SStefano Zampini full_restr = PETSC_FALSE; 756557de7509SStefano Zampini } else { 756657de7509SStefano Zampini ncoarse = pcbddc->coarse_size/pcbddc->coarse_eqs_per_proc; 756757de7509SStefano Zampini restr = PETSC_TRUE; 756857de7509SStefano Zampini full_restr = PETSC_TRUE; 756957de7509SStefano Zampini } 75707de4f681Sstefano_zampini if (!pcbddc->coarse_size || commsize == 1) multilevel_allowed = multilevel_requested = restr = full_restr = PETSC_FALSE; 757157de7509SStefano 
Zampini ncoarse = PetscMax(1,ncoarse); 757257de7509SStefano Zampini if (!pcbddc->coarse_subassembling) { 7573a198735bSStefano Zampini if (pcbddc->coarsening_ratio > 1) { 7574bb360cb4SStefano Zampini if (multilevel_requested) { 7575bb360cb4SStefano Zampini ierr = PCBDDCMatISGetSubassemblingPattern(pc->pmat,&ncoarse,pcbddc->coarse_adj_red,&pcbddc->coarse_subassembling,&have_void);CHKERRQ(ierr); 7576bb360cb4SStefano Zampini } else { 7577bb360cb4SStefano Zampini ierr = PCBDDCMatISGetSubassemblingPattern(t_coarse_mat_is,&ncoarse,pcbddc->coarse_adj_red,&pcbddc->coarse_subassembling,&have_void);CHKERRQ(ierr); 7578bb360cb4SStefano Zampini } 7579a198735bSStefano Zampini } else { 75807de4f681Sstefano_zampini PetscMPIInt rank; 7581a198735bSStefano Zampini ierr = MPI_Comm_rank(PetscObjectComm((PetscObject)pc),&rank);CHKERRQ(ierr); 75827de4f681Sstefano_zampini have_void = (active_procs == (PetscInt)commsize) ? PETSC_FALSE : PETSC_TRUE; 7583a198735bSStefano Zampini ierr = ISCreateStride(PetscObjectComm((PetscObject)pc),1,rank,1,&pcbddc->coarse_subassembling);CHKERRQ(ierr); 7584a198735bSStefano Zampini } 758557de7509SStefano Zampini } else { /* if a subassembling pattern exists, then we can reuse the coarse ksp and compute the number of process involved */ 758657de7509SStefano Zampini PetscInt psum; 758757de7509SStefano Zampini if (pcbddc->coarse_ksp) psum = 1; 758857de7509SStefano Zampini else psum = 0; 758957de7509SStefano Zampini ierr = MPIU_Allreduce(&psum,&ncoarse,1,MPIU_INT,MPI_SUM,PetscObjectComm((PetscObject)pc));CHKERRQ(ierr); 75907de4f681Sstefano_zampini if (ncoarse < commsize) have_void = PETSC_TRUE; 759157de7509SStefano Zampini } 759257de7509SStefano Zampini /* determine if we can go multilevel */ 759357de7509SStefano Zampini if (multilevel_requested) { 759457de7509SStefano Zampini if (ncoarse > 1) multilevel_allowed = PETSC_TRUE; /* found enough processes */ 759557de7509SStefano Zampini else restr = full_restr = PETSC_TRUE; /* 1 subdomain, use a direct solver */ 
759657de7509SStefano Zampini } 759757de7509SStefano Zampini if (multilevel_allowed && have_void) restr = PETSC_TRUE; 759857de7509SStefano Zampini 7599e4d548c7SStefano Zampini /* dump subassembling pattern */ 7600e4d548c7SStefano Zampini if (pcbddc->dbg_flag && multilevel_allowed) { 7601e4d548c7SStefano Zampini ierr = ISView(pcbddc->coarse_subassembling,pcbddc->dbg_viewer);CHKERRQ(ierr); 7602e4d548c7SStefano Zampini } 7603e4d548c7SStefano Zampini 76046e683305SStefano Zampini /* compute dofs splitting and neumann boundaries for coarse dofs */ 76051e0482f5SStefano Zampini nedcfield = -1; 76061e0482f5SStefano Zampini if (multilevel_allowed && !coarse_reuse && (pcbddc->n_ISForDofsLocal || pcbddc->NeumannBoundariesLocal || pcbddc->nedclocal)) { /* protects from unneded computations */ 76076e683305SStefano Zampini PetscInt *tidxs,*tidxs2,nout,tsize,i; 76086e683305SStefano Zampini const PetscInt *idxs; 76096e683305SStefano Zampini ISLocalToGlobalMapping tmap; 76106e683305SStefano Zampini 76116e683305SStefano Zampini /* create map between primal indices (in local representative ordering) and local primal numbering */ 76120be93d54SStefano Zampini ierr = ISLocalToGlobalMappingCreate(PETSC_COMM_SELF,1,pcbddc->local_primal_size,pcbddc->primal_indices_local_idxs,PETSC_COPY_VALUES,&tmap);CHKERRQ(ierr); 76136e683305SStefano Zampini /* allocate space for temporary storage */ 7614854ce69bSBarry Smith ierr = PetscMalloc1(pcbddc->local_primal_size,&tidxs);CHKERRQ(ierr); 7615854ce69bSBarry Smith ierr = PetscMalloc1(pcbddc->local_primal_size,&tidxs2);CHKERRQ(ierr); 76166e683305SStefano Zampini /* allocate for IS array */ 76176e683305SStefano Zampini nisdofs = pcbddc->n_ISForDofsLocal; 76181e0482f5SStefano Zampini if (pcbddc->nedclocal) { 76191e0482f5SStefano Zampini if (pcbddc->nedfield > -1) { 76201e0482f5SStefano Zampini nedcfield = pcbddc->nedfield; 76211e0482f5SStefano Zampini } else { 76221e0482f5SStefano Zampini nedcfield = 0; 76231e0482f5SStefano Zampini if (nisdofs) 
SETERRQ1(PetscObjectComm((PetscObject)pc),PETSC_ERR_PLIB,"This should not happen (%d)",nisdofs); 76241e0482f5SStefano Zampini nisdofs = 1; 76251e0482f5SStefano Zampini } 76261e0482f5SStefano Zampini } 76276e683305SStefano Zampini nisneu = !!pcbddc->NeumannBoundariesLocal; 762827b6a85dSStefano Zampini nisvert = 0; /* nisvert is not used */ 762930368db7SStefano Zampini nis = nisdofs + nisneu + nisvert; 7630854ce69bSBarry Smith ierr = PetscMalloc1(nis,&isarray);CHKERRQ(ierr); 76316e683305SStefano Zampini /* dofs splitting */ 76326e683305SStefano Zampini for (i=0;i<nisdofs;i++) { 76336e683305SStefano Zampini /* ierr = ISView(pcbddc->ISForDofsLocal[i],0);CHKERRQ(ierr); */ 76341e0482f5SStefano Zampini if (nedcfield != i) { 76356e683305SStefano Zampini ierr = ISGetLocalSize(pcbddc->ISForDofsLocal[i],&tsize);CHKERRQ(ierr); 76366e683305SStefano Zampini ierr = ISGetIndices(pcbddc->ISForDofsLocal[i],&idxs);CHKERRQ(ierr); 76376e683305SStefano Zampini ierr = ISGlobalToLocalMappingApply(tmap,IS_GTOLM_DROP,tsize,idxs,&nout,tidxs);CHKERRQ(ierr); 76386e683305SStefano Zampini ierr = ISRestoreIndices(pcbddc->ISForDofsLocal[i],&idxs);CHKERRQ(ierr); 76391e0482f5SStefano Zampini } else { 76401e0482f5SStefano Zampini ierr = ISGetLocalSize(pcbddc->nedclocal,&tsize);CHKERRQ(ierr); 76411e0482f5SStefano Zampini ierr = ISGetIndices(pcbddc->nedclocal,&idxs);CHKERRQ(ierr); 76421e0482f5SStefano Zampini ierr = ISGlobalToLocalMappingApply(tmap,IS_GTOLM_DROP,tsize,idxs,&nout,tidxs);CHKERRQ(ierr); 7643eee23b56SStefano Zampini if (tsize != nout) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Failed when mapping coarse nedelec field! 
%d != %d\n",tsize,nout); 76441e0482f5SStefano Zampini ierr = ISRestoreIndices(pcbddc->nedclocal,&idxs);CHKERRQ(ierr); 76451e0482f5SStefano Zampini } 76466e683305SStefano Zampini ierr = ISLocalToGlobalMappingApply(coarse_islg,nout,tidxs,tidxs2);CHKERRQ(ierr); 764730368db7SStefano Zampini ierr = ISCreateGeneral(PetscObjectComm((PetscObject)pc),nout,tidxs2,PETSC_COPY_VALUES,&isarray[i]);CHKERRQ(ierr); 76486e683305SStefano Zampini /* ierr = ISView(isarray[i],0);CHKERRQ(ierr); */ 76496e683305SStefano Zampini } 76506e683305SStefano Zampini /* neumann boundaries */ 76516e683305SStefano Zampini if (pcbddc->NeumannBoundariesLocal) { 76526e683305SStefano Zampini /* ierr = ISView(pcbddc->NeumannBoundariesLocal,0);CHKERRQ(ierr); */ 76536e683305SStefano Zampini ierr = ISGetLocalSize(pcbddc->NeumannBoundariesLocal,&tsize);CHKERRQ(ierr); 76546e683305SStefano Zampini ierr = ISGetIndices(pcbddc->NeumannBoundariesLocal,&idxs);CHKERRQ(ierr); 76556e683305SStefano Zampini ierr = ISGlobalToLocalMappingApply(tmap,IS_GTOLM_DROP,tsize,idxs,&nout,tidxs);CHKERRQ(ierr); 76566e683305SStefano Zampini ierr = ISRestoreIndices(pcbddc->NeumannBoundariesLocal,&idxs);CHKERRQ(ierr); 76576e683305SStefano Zampini ierr = ISLocalToGlobalMappingApply(coarse_islg,nout,tidxs,tidxs2);CHKERRQ(ierr); 765830368db7SStefano Zampini ierr = ISCreateGeneral(PetscObjectComm((PetscObject)pc),nout,tidxs2,PETSC_COPY_VALUES,&isarray[nisdofs]);CHKERRQ(ierr); 76596e683305SStefano Zampini /* ierr = ISView(isarray[nisdofs],0);CHKERRQ(ierr); */ 76606e683305SStefano Zampini } 76616e683305SStefano Zampini /* free memory */ 76626e683305SStefano Zampini ierr = PetscFree(tidxs);CHKERRQ(ierr); 76636e683305SStefano Zampini ierr = PetscFree(tidxs2);CHKERRQ(ierr); 76646e683305SStefano Zampini ierr = ISLocalToGlobalMappingDestroy(&tmap);CHKERRQ(ierr); 76656e683305SStefano Zampini } else { 76666e683305SStefano Zampini nis = 0; 76676e683305SStefano Zampini nisdofs = 0; 76686e683305SStefano Zampini nisneu = 0; 766930368db7SStefano Zampini 
nisvert = 0; 76706e683305SStefano Zampini isarray = NULL; 76716e683305SStefano Zampini } 76726e683305SStefano Zampini /* destroy no longer needed map */ 76736e683305SStefano Zampini ierr = ISLocalToGlobalMappingDestroy(&coarse_islg);CHKERRQ(ierr); 76746e683305SStefano Zampini 767557de7509SStefano Zampini /* subassemble */ 767657de7509SStefano Zampini if (multilevel_allowed) { 76771ae86dd6SStefano Zampini Vec vp[1]; 76781ae86dd6SStefano Zampini PetscInt nvecs = 0; 767957de7509SStefano Zampini PetscBool reuse,reuser; 76801ae86dd6SStefano Zampini 768157de7509SStefano Zampini if (coarse_mat) reuse = PETSC_TRUE; 768257de7509SStefano Zampini else reuse = PETSC_FALSE; 768357de7509SStefano Zampini ierr = MPIU_Allreduce(&reuse,&reuser,1,MPIU_BOOL,MPI_LOR,PetscObjectComm((PetscObject)pc));CHKERRQ(ierr); 76841ae86dd6SStefano Zampini vp[0] = NULL; 76851ae86dd6SStefano Zampini if (pcbddc->benign_have_null) { /* propagate no-net-flux quadrature to coarser level */ 76861ae86dd6SStefano Zampini ierr = VecCreate(PetscObjectComm((PetscObject)pc),&vp[0]);CHKERRQ(ierr); 76871ae86dd6SStefano Zampini ierr = VecSetSizes(vp[0],pcbddc->local_primal_size,PETSC_DECIDE);CHKERRQ(ierr); 76881ae86dd6SStefano Zampini ierr = VecSetType(vp[0],VECSTANDARD);CHKERRQ(ierr); 76891ae86dd6SStefano Zampini nvecs = 1; 76901ae86dd6SStefano Zampini 76911ae86dd6SStefano Zampini if (pcbddc->divudotp) { 7692a198735bSStefano Zampini Mat B,loc_divudotp; 76931ae86dd6SStefano Zampini Vec v,p; 76941ae86dd6SStefano Zampini IS dummy; 76951ae86dd6SStefano Zampini PetscInt np; 76961ae86dd6SStefano Zampini 7697a198735bSStefano Zampini ierr = MatISGetLocalMat(pcbddc->divudotp,&loc_divudotp);CHKERRQ(ierr); 7698a198735bSStefano Zampini ierr = MatGetSize(loc_divudotp,&np,NULL);CHKERRQ(ierr); 76991ae86dd6SStefano Zampini ierr = ISCreateStride(PETSC_COMM_SELF,np,0,1,&dummy);CHKERRQ(ierr); 77007dae84e0SHong Zhang ierr = MatCreateSubMatrix(loc_divudotp,dummy,pcis->is_B_local,MAT_INITIAL_MATRIX,&B);CHKERRQ(ierr); 
77011ae86dd6SStefano Zampini ierr = MatCreateVecs(B,&v,&p);CHKERRQ(ierr); 77021ae86dd6SStefano Zampini ierr = VecSet(p,1.);CHKERRQ(ierr); 77031ae86dd6SStefano Zampini ierr = MatMultTranspose(B,p,v);CHKERRQ(ierr); 77041ae86dd6SStefano Zampini ierr = VecDestroy(&p);CHKERRQ(ierr); 77051ae86dd6SStefano Zampini ierr = MatDestroy(&B);CHKERRQ(ierr); 77061ae86dd6SStefano Zampini ierr = VecGetArray(vp[0],&array);CHKERRQ(ierr); 77071ae86dd6SStefano Zampini ierr = VecPlaceArray(pcbddc->vec1_P,array);CHKERRQ(ierr); 77081ae86dd6SStefano Zampini ierr = VecRestoreArray(vp[0],&array);CHKERRQ(ierr); 77091ae86dd6SStefano Zampini ierr = MatMultTranspose(pcbddc->coarse_phi_B,v,pcbddc->vec1_P);CHKERRQ(ierr); 77101ae86dd6SStefano Zampini ierr = VecResetArray(pcbddc->vec1_P);CHKERRQ(ierr); 77111ae86dd6SStefano Zampini ierr = ISDestroy(&dummy);CHKERRQ(ierr); 77121ae86dd6SStefano Zampini ierr = VecDestroy(&v);CHKERRQ(ierr); 771374e2c79eSStefano Zampini } 77141ae86dd6SStefano Zampini } 77151ae86dd6SStefano Zampini if (reuser) { 77161e0482f5SStefano Zampini ierr = PCBDDCMatISSubassemble(t_coarse_mat_is,pcbddc->coarse_subassembling,0,restr,full_restr,PETSC_TRUE,&coarse_mat,nis,isarray,nvecs,vp);CHKERRQ(ierr); 771774e2c79eSStefano Zampini } else { 77181e0482f5SStefano Zampini ierr = PCBDDCMatISSubassemble(t_coarse_mat_is,pcbddc->coarse_subassembling,0,restr,full_restr,PETSC_FALSE,&coarse_mat_is,nis,isarray,nvecs,vp);CHKERRQ(ierr); 77191ae86dd6SStefano Zampini } 77201ae86dd6SStefano Zampini if (vp[0]) { /* vp[0] could have been placed on a different set of processes */ 77211ae86dd6SStefano Zampini PetscScalar *arraym,*arrayv; 77221ae86dd6SStefano Zampini PetscInt nl; 77231ae86dd6SStefano Zampini ierr = VecGetLocalSize(vp[0],&nl);CHKERRQ(ierr); 77241ae86dd6SStefano Zampini ierr = MatCreateSeqDense(PETSC_COMM_SELF,1,nl,NULL,&coarsedivudotp);CHKERRQ(ierr); 77251ae86dd6SStefano Zampini ierr = MatDenseGetArray(coarsedivudotp,&arraym);CHKERRQ(ierr); 77261ae86dd6SStefano Zampini ierr = 
VecGetArray(vp[0],&arrayv);CHKERRQ(ierr); 77271ae86dd6SStefano Zampini ierr = PetscMemcpy(arraym,arrayv,nl*sizeof(PetscScalar));CHKERRQ(ierr); 77281ae86dd6SStefano Zampini ierr = VecRestoreArray(vp[0],&arrayv);CHKERRQ(ierr); 77291ae86dd6SStefano Zampini ierr = MatDenseRestoreArray(coarsedivudotp,&arraym);CHKERRQ(ierr); 77301ae86dd6SStefano Zampini ierr = VecDestroy(&vp[0]);CHKERRQ(ierr); 7731a198735bSStefano Zampini } else { 7732a198735bSStefano Zampini ierr = MatCreateSeqAIJ(PETSC_COMM_SELF,0,0,1,NULL,&coarsedivudotp);CHKERRQ(ierr); 77331ae86dd6SStefano Zampini } 77341ae86dd6SStefano Zampini } else { 77351e0482f5SStefano Zampini ierr = PCBDDCMatISSubassemble(t_coarse_mat_is,pcbddc->coarse_subassembling,0,restr,full_restr,PETSC_FALSE,&coarse_mat_is,0,NULL,0,NULL);CHKERRQ(ierr); 77366e683305SStefano Zampini } 773757de7509SStefano Zampini if (coarse_mat_is || coarse_mat) { 773857de7509SStefano Zampini PetscMPIInt size; 7739f913dca9SStefano Zampini ierr = MPI_Comm_size(PetscObjectComm((PetscObject)coarse_mat_is),&size);CHKERRQ(ierr); 774057de7509SStefano Zampini if (!multilevel_allowed) { 774157de7509SStefano Zampini ierr = MatISGetMPIXAIJ(coarse_mat_is,coarse_mat_reuse,&coarse_mat);CHKERRQ(ierr); 77426e683305SStefano Zampini } else { 774357de7509SStefano Zampini Mat A; 7744779c1cceSStefano Zampini 774557de7509SStefano Zampini /* if this matrix is present, it means we are not reusing the coarse matrix */ 774657de7509SStefano Zampini if (coarse_mat_is) { 774757de7509SStefano Zampini if (coarse_mat) SETERRQ(PetscObjectComm((PetscObject)coarse_mat_is),PETSC_ERR_PLIB,"This should not happen"); 774857de7509SStefano Zampini ierr = PetscObjectReference((PetscObject)coarse_mat_is);CHKERRQ(ierr); 774957de7509SStefano Zampini coarse_mat = coarse_mat_is; 775057de7509SStefano Zampini } 775157de7509SStefano Zampini /* be sure we don't have MatSeqDENSE as local mat */ 775257de7509SStefano Zampini ierr = MatISGetLocalMat(coarse_mat,&A);CHKERRQ(ierr); 775357de7509SStefano Zampini 
ierr = MatConvert(A,MATSEQAIJ,MAT_INPLACE_MATRIX,&A);CHKERRQ(ierr); 7754779c1cceSStefano Zampini } 7755779c1cceSStefano Zampini } 775657de7509SStefano Zampini ierr = MatDestroy(&t_coarse_mat_is);CHKERRQ(ierr); 775757de7509SStefano Zampini ierr = MatDestroy(&coarse_mat_is);CHKERRQ(ierr); 77586e683305SStefano Zampini 77596e683305SStefano Zampini /* create local to global scatters for coarse problem */ 776068457ee5SStefano Zampini if (compute_vecs) { 77616e683305SStefano Zampini PetscInt lrows; 77626e683305SStefano Zampini ierr = VecDestroy(&pcbddc->coarse_vec);CHKERRQ(ierr); 776357de7509SStefano Zampini if (coarse_mat) { 776457de7509SStefano Zampini ierr = MatGetLocalSize(coarse_mat,&lrows,NULL);CHKERRQ(ierr); 77656e683305SStefano Zampini } else { 77666e683305SStefano Zampini lrows = 0; 77676e683305SStefano Zampini } 77686e683305SStefano Zampini ierr = VecCreate(PetscObjectComm((PetscObject)pc),&pcbddc->coarse_vec);CHKERRQ(ierr); 77696e683305SStefano Zampini ierr = VecSetSizes(pcbddc->coarse_vec,lrows,PETSC_DECIDE);CHKERRQ(ierr); 77706e683305SStefano Zampini ierr = VecSetType(pcbddc->coarse_vec,VECSTANDARD);CHKERRQ(ierr); 77716e683305SStefano Zampini ierr = VecScatterDestroy(&pcbddc->coarse_loc_to_glob);CHKERRQ(ierr); 77726e683305SStefano Zampini ierr = VecScatterCreate(pcbddc->vec1_P,NULL,pcbddc->coarse_vec,coarse_is,&pcbddc->coarse_loc_to_glob);CHKERRQ(ierr); 77736e683305SStefano Zampini } 77746e683305SStefano Zampini ierr = ISDestroy(&coarse_is);CHKERRQ(ierr); 7775c8587f34SStefano Zampini 7776f9eb5b7dSStefano Zampini /* set defaults for coarse KSP and PC */ 7777f9eb5b7dSStefano Zampini if (multilevel_allowed) { 7778f9eb5b7dSStefano Zampini coarse_ksp_type = KSPRICHARDSON; 7779f9eb5b7dSStefano Zampini coarse_pc_type = PCBDDC; 7780f9eb5b7dSStefano Zampini } else { 7781f9eb5b7dSStefano Zampini coarse_ksp_type = KSPPREONLY; 7782f9eb5b7dSStefano Zampini coarse_pc_type = PCREDUNDANT; 7783c8587f34SStefano Zampini } 7784c8587f34SStefano Zampini 77856e683305SStefano 
Zampini /* print some info if requested */ 77866e683305SStefano Zampini if (pcbddc->dbg_flag) { 77876e683305SStefano Zampini if (!multilevel_allowed) { 77886e683305SStefano Zampini ierr = PetscViewerASCIIPrintf(pcbddc->dbg_viewer,"--------------------------------------------------\n");CHKERRQ(ierr); 77896e683305SStefano Zampini if (multilevel_requested) { 77906e683305SStefano Zampini ierr = PetscViewerASCIIPrintf(pcbddc->dbg_viewer,"Not enough active processes on level %d (active processes %d, coarsening ratio %d)\n",pcbddc->current_level,active_procs,pcbddc->coarsening_ratio);CHKERRQ(ierr); 77916e683305SStefano Zampini } else if (pcbddc->max_levels) { 77926e683305SStefano Zampini ierr = PetscViewerASCIIPrintf(pcbddc->dbg_viewer,"Maximum number of requested levels reached (%d)\n",pcbddc->max_levels);CHKERRQ(ierr); 77936e683305SStefano Zampini } 77946e683305SStefano Zampini ierr = PetscViewerFlush(pcbddc->dbg_viewer);CHKERRQ(ierr); 77956e683305SStefano Zampini } 77966e683305SStefano Zampini } 77976e683305SStefano Zampini 77981e0482f5SStefano Zampini /* communicate coarse discrete gradient */ 77991e0482f5SStefano Zampini coarseG = NULL; 78001e0482f5SStefano Zampini if (pcbddc->nedcG && multilevel_allowed) { 78011e0482f5SStefano Zampini MPI_Comm ccomm; 78021e0482f5SStefano Zampini if (coarse_mat) { 78031e0482f5SStefano Zampini ccomm = PetscObjectComm((PetscObject)coarse_mat); 78041e0482f5SStefano Zampini } else { 78051e0482f5SStefano Zampini ccomm = MPI_COMM_NULL; 78061e0482f5SStefano Zampini } 78071e0482f5SStefano Zampini ierr = MatMPIAIJRestrict(pcbddc->nedcG,ccomm,&coarseG);CHKERRQ(ierr); 78081e0482f5SStefano Zampini } 78091e0482f5SStefano Zampini 7810f9eb5b7dSStefano Zampini /* create the coarse KSP object only once with defaults */ 781157de7509SStefano Zampini if (coarse_mat) { 78127274672aSStefano Zampini PetscBool isredundant,isnn,isbddc; 78136a1308c2SStefano Zampini PetscViewer dbg_viewer = NULL; 78147274672aSStefano Zampini 78156e683305SStefano Zampini if 
(pcbddc->dbg_flag) { 781657de7509SStefano Zampini dbg_viewer = PETSC_VIEWER_STDOUT_(PetscObjectComm((PetscObject)coarse_mat)); 78176e683305SStefano Zampini ierr = PetscViewerASCIIAddTab(dbg_viewer,2*pcbddc->current_level);CHKERRQ(ierr); 78186e683305SStefano Zampini } 7819f9eb5b7dSStefano Zampini if (!pcbddc->coarse_ksp) { 7820312be037SStefano Zampini char prefix[256],str_level[16]; 7821e604994aSStefano Zampini size_t len; 78221e0482f5SStefano Zampini 782357de7509SStefano Zampini ierr = KSPCreate(PetscObjectComm((PetscObject)coarse_mat),&pcbddc->coarse_ksp);CHKERRQ(ierr); 7824422a814eSBarry Smith ierr = KSPSetErrorIfNotConverged(pcbddc->coarse_ksp,pc->erroriffailure);CHKERRQ(ierr); 7825c8587f34SStefano Zampini ierr = PetscObjectIncrementTabLevel((PetscObject)pcbddc->coarse_ksp,(PetscObject)pc,1);CHKERRQ(ierr); 7826f9eb5b7dSStefano Zampini ierr = KSPSetTolerances(pcbddc->coarse_ksp,PETSC_DEFAULT,PETSC_DEFAULT,PETSC_DEFAULT,1);CHKERRQ(ierr); 782757de7509SStefano Zampini ierr = KSPSetOperators(pcbddc->coarse_ksp,coarse_mat,coarse_mat);CHKERRQ(ierr); 7828c8587f34SStefano Zampini ierr = KSPSetType(pcbddc->coarse_ksp,coarse_ksp_type);CHKERRQ(ierr); 78296e683305SStefano Zampini ierr = KSPSetNormType(pcbddc->coarse_ksp,KSP_NORM_NONE);CHKERRQ(ierr); 7830c8587f34SStefano Zampini ierr = KSPGetPC(pcbddc->coarse_ksp,&pc_temp);CHKERRQ(ierr); 78311e0482f5SStefano Zampini /* TODO is this logic correct? 
should check for coarse_mat type */ 7832c8587f34SStefano Zampini ierr = PCSetType(pc_temp,coarse_pc_type);CHKERRQ(ierr); 7833e604994aSStefano Zampini /* prefix */ 7834e604994aSStefano Zampini ierr = PetscStrcpy(prefix,"");CHKERRQ(ierr); 7835e604994aSStefano Zampini ierr = PetscStrcpy(str_level,"");CHKERRQ(ierr); 7836e604994aSStefano Zampini if (!pcbddc->current_level) { 7837e604994aSStefano Zampini ierr = PetscStrcpy(prefix,((PetscObject)pc)->prefix);CHKERRQ(ierr); 7838e604994aSStefano Zampini ierr = PetscStrcat(prefix,"pc_bddc_coarse_");CHKERRQ(ierr); 7839c8587f34SStefano Zampini } else { 7840e604994aSStefano Zampini ierr = PetscStrlen(((PetscObject)pc)->prefix,&len);CHKERRQ(ierr); 7841312be037SStefano Zampini if (pcbddc->current_level>1) len -= 3; /* remove "lX_" with X level number */ 7842312be037SStefano Zampini if (pcbddc->current_level>10) len -= 1; /* remove another char from level number */ 784334d6797cSStefano Zampini ierr = PetscStrncpy(prefix,((PetscObject)pc)->prefix,len+1);CHKERRQ(ierr); 784435529e7bSStefano Zampini ierr = PetscSNPrintf(str_level,sizeof(str_level),"l%d_",(int)(pcbddc->current_level));CHKERRQ(ierr); 7845e604994aSStefano Zampini ierr = PetscStrcat(prefix,str_level);CHKERRQ(ierr); 7846e604994aSStefano Zampini } 7847e604994aSStefano Zampini ierr = KSPSetOptionsPrefix(pcbddc->coarse_ksp,prefix);CHKERRQ(ierr); 78483e3c6dadSStefano Zampini /* propagate BDDC info to the next level (these are dummy calls if pc_temp is not of type PCBDDC) */ 78493e3c6dadSStefano Zampini ierr = PCBDDCSetLevel(pc_temp,pcbddc->current_level+1);CHKERRQ(ierr); 78503e3c6dadSStefano Zampini ierr = PCBDDCSetCoarseningRatio(pc_temp,pcbddc->coarsening_ratio);CHKERRQ(ierr); 78513e3c6dadSStefano Zampini ierr = PCBDDCSetLevels(pc_temp,pcbddc->max_levels);CHKERRQ(ierr); 7852f9eb5b7dSStefano Zampini /* allow user customization */ 7853f9eb5b7dSStefano Zampini ierr = KSPSetFromOptions(pcbddc->coarse_ksp);CHKERRQ(ierr); 78543e3c6dadSStefano Zampini } 78553e3c6dadSStefano Zampini 
/* propagate BDDC info to the next level (these are dummy calls if pc_temp is not of type PCBDDC) */ 785651bea450SStefano Zampini ierr = KSPGetPC(pcbddc->coarse_ksp,&pc_temp);CHKERRQ(ierr); 78573e3c6dadSStefano Zampini if (nisdofs) { 78583e3c6dadSStefano Zampini ierr = PCBDDCSetDofsSplitting(pc_temp,nisdofs,isarray);CHKERRQ(ierr); 78593e3c6dadSStefano Zampini for (i=0;i<nisdofs;i++) { 78603e3c6dadSStefano Zampini ierr = ISDestroy(&isarray[i]);CHKERRQ(ierr); 78613e3c6dadSStefano Zampini } 78623e3c6dadSStefano Zampini } 78633e3c6dadSStefano Zampini if (nisneu) { 78643e3c6dadSStefano Zampini ierr = PCBDDCSetNeumannBoundaries(pc_temp,isarray[nisdofs]);CHKERRQ(ierr); 78653e3c6dadSStefano Zampini ierr = ISDestroy(&isarray[nisdofs]);CHKERRQ(ierr); 7866312be037SStefano Zampini } 786730368db7SStefano Zampini if (nisvert) { 786830368db7SStefano Zampini ierr = PCBDDCSetPrimalVerticesIS(pc_temp,isarray[nis-1]);CHKERRQ(ierr); 786930368db7SStefano Zampini ierr = ISDestroy(&isarray[nis-1]);CHKERRQ(ierr); 787030368db7SStefano Zampini } 78711e0482f5SStefano Zampini if (coarseG) { 78721e0482f5SStefano Zampini ierr = PCBDDCSetDiscreteGradient(pc_temp,coarseG,1,nedcfield,PETSC_FALSE,PETSC_TRUE);CHKERRQ(ierr); 78731e0482f5SStefano Zampini } 7874f9eb5b7dSStefano Zampini 7875f9eb5b7dSStefano Zampini /* get some info after set from options */ 7876f9eb5b7dSStefano Zampini ierr = PetscObjectTypeCompare((PetscObject)pc_temp,PCBDDC,&isbddc);CHKERRQ(ierr); 7877b76f3995Sstefano_zampini /* multilevel can only be requested via -pc_bddc_levels or PCBDDCSetLevels */ 7878b76f3995Sstefano_zampini if (isbddc && !multilevel_allowed) { 7879f9eb5b7dSStefano Zampini ierr = PCSetType(pc_temp,coarse_pc_type);CHKERRQ(ierr); 7880f9eb5b7dSStefano Zampini isbddc = PETSC_FALSE; 7881f9eb5b7dSStefano Zampini } 7882b76f3995Sstefano_zampini /* multilevel cannot be done with coarse PCs different from BDDC or NN */ 78837274672aSStefano Zampini ierr = 
PetscObjectTypeCompare((PetscObject)pc_temp,PCNN,&isnn);CHKERRQ(ierr); 78847274672aSStefano Zampini if (multilevel_requested && multilevel_allowed && !isbddc && !isnn) { 7885b76f3995Sstefano_zampini ierr = PCSetType(pc_temp,PCBDDC);CHKERRQ(ierr); 7886b76f3995Sstefano_zampini isbddc = PETSC_TRUE; 7887b76f3995Sstefano_zampini } 788839f0f02cSStefano Zampini ierr = PCFactorSetReuseFill(pc_temp,PETSC_TRUE);CHKERRQ(ierr); 78897274672aSStefano Zampini ierr = PetscObjectTypeCompare((PetscObject)pc_temp,PCREDUNDANT,&isredundant);CHKERRQ(ierr); 78904f3a063dSStefano Zampini if (isredundant) { 78914f3a063dSStefano Zampini KSP inner_ksp; 78924f3a063dSStefano Zampini PC inner_pc; 78939326c5c6Sstefano_zampini 78944f3a063dSStefano Zampini ierr = PCRedundantGetKSP(pc_temp,&inner_ksp);CHKERRQ(ierr); 78954f3a063dSStefano Zampini ierr = KSPGetPC(inner_ksp,&inner_pc);CHKERRQ(ierr); 78964f3a063dSStefano Zampini ierr = PCFactorSetReuseFill(inner_pc,PETSC_TRUE);CHKERRQ(ierr); 78974f3a063dSStefano Zampini } 7898f9eb5b7dSStefano Zampini 789957de7509SStefano Zampini /* parameters which miss an API */ 79007274672aSStefano Zampini ierr = PetscObjectTypeCompare((PetscObject)pc_temp,PCBDDC,&isbddc);CHKERRQ(ierr); 790157de7509SStefano Zampini if (isbddc) { 7902720d30f9SStefano Zampini PC_BDDC* pcbddc_coarse = (PC_BDDC*)pc_temp->data; 79037274672aSStefano Zampini 7904720d30f9SStefano Zampini pcbddc_coarse->detect_disconnected = PETSC_TRUE; 790557de7509SStefano Zampini pcbddc_coarse->coarse_eqs_per_proc = pcbddc->coarse_eqs_per_proc; 790627b6a85dSStefano Zampini pcbddc_coarse->benign_saddle_point = pcbddc->benign_have_null; 790727b6a85dSStefano Zampini if (pcbddc_coarse->benign_saddle_point) { 7908a198735bSStefano Zampini Mat coarsedivudotp_is; 7909a198735bSStefano Zampini ISLocalToGlobalMapping l2gmap,rl2g,cl2g; 7910a198735bSStefano Zampini IS row,col; 7911a198735bSStefano Zampini const PetscInt *gidxs; 7912a198735bSStefano Zampini PetscInt n,st,M,N; 7913a198735bSStefano Zampini 
7914a198735bSStefano Zampini ierr = MatGetSize(coarsedivudotp,&n,NULL);CHKERRQ(ierr); 7915a198735bSStefano Zampini ierr = MPI_Scan(&n,&st,1,MPIU_INT,MPI_SUM,PetscObjectComm((PetscObject)coarse_mat));CHKERRQ(ierr); 7916a198735bSStefano Zampini st = st-n; 7917a198735bSStefano Zampini ierr = ISCreateStride(PetscObjectComm((PetscObject)coarse_mat),1,st,1,&row);CHKERRQ(ierr); 7918a198735bSStefano Zampini ierr = MatGetLocalToGlobalMapping(coarse_mat,&l2gmap,NULL);CHKERRQ(ierr); 7919a198735bSStefano Zampini ierr = ISLocalToGlobalMappingGetSize(l2gmap,&n);CHKERRQ(ierr); 7920a198735bSStefano Zampini ierr = ISLocalToGlobalMappingGetIndices(l2gmap,&gidxs);CHKERRQ(ierr); 7921a198735bSStefano Zampini ierr = ISCreateGeneral(PetscObjectComm((PetscObject)coarse_mat),n,gidxs,PETSC_COPY_VALUES,&col);CHKERRQ(ierr); 7922a198735bSStefano Zampini ierr = ISLocalToGlobalMappingRestoreIndices(l2gmap,&gidxs);CHKERRQ(ierr); 7923a198735bSStefano Zampini ierr = ISLocalToGlobalMappingCreateIS(row,&rl2g);CHKERRQ(ierr); 7924a198735bSStefano Zampini ierr = ISLocalToGlobalMappingCreateIS(col,&cl2g);CHKERRQ(ierr); 7925a198735bSStefano Zampini ierr = ISGetSize(row,&M);CHKERRQ(ierr); 7926a198735bSStefano Zampini ierr = MatGetSize(coarse_mat,&N,NULL);CHKERRQ(ierr); 7927a198735bSStefano Zampini ierr = ISDestroy(&row);CHKERRQ(ierr); 7928a198735bSStefano Zampini ierr = ISDestroy(&col);CHKERRQ(ierr); 7929a198735bSStefano Zampini ierr = MatCreate(PetscObjectComm((PetscObject)coarse_mat),&coarsedivudotp_is);CHKERRQ(ierr); 7930a198735bSStefano Zampini ierr = MatSetType(coarsedivudotp_is,MATIS);CHKERRQ(ierr); 7931a198735bSStefano Zampini ierr = MatSetSizes(coarsedivudotp_is,PETSC_DECIDE,PETSC_DECIDE,M,N);CHKERRQ(ierr); 7932a198735bSStefano Zampini ierr = MatSetLocalToGlobalMapping(coarsedivudotp_is,rl2g,cl2g);CHKERRQ(ierr); 7933a198735bSStefano Zampini ierr = ISLocalToGlobalMappingDestroy(&rl2g);CHKERRQ(ierr); 7934a198735bSStefano Zampini ierr = ISLocalToGlobalMappingDestroy(&cl2g);CHKERRQ(ierr); 
7935a198735bSStefano Zampini ierr = MatISSetLocalMat(coarsedivudotp_is,coarsedivudotp);CHKERRQ(ierr); 7936a198735bSStefano Zampini ierr = MatDestroy(&coarsedivudotp);CHKERRQ(ierr); 79378ae0ca82SStefano Zampini ierr = PCBDDCSetDivergenceMat(pc_temp,coarsedivudotp_is,PETSC_FALSE,NULL);CHKERRQ(ierr); 7938a198735bSStefano Zampini ierr = MatDestroy(&coarsedivudotp_is);CHKERRQ(ierr); 7939720d30f9SStefano Zampini pcbddc_coarse->adaptive_userdefined = PETSC_TRUE; 794059e48ca4SStefano Zampini if (pcbddc->adaptive_threshold < 1.0) pcbddc_coarse->deluxe_zerorows = PETSC_TRUE; 7941720d30f9SStefano Zampini } 7942d4d8cf7bSStefano Zampini } 79439881197aSStefano Zampini 79443301b35fSStefano Zampini /* propagate symmetry info of coarse matrix */ 79455a16e3a0SStefano Zampini ierr = MatSetOption(coarse_mat,MAT_STRUCTURALLY_SYMMETRIC,PETSC_TRUE);CHKERRQ(ierr); 79463301b35fSStefano Zampini if (pc->pmat->symmetric_set) { 79473301b35fSStefano Zampini ierr = MatSetOption(coarse_mat,MAT_SYMMETRIC,pc->pmat->symmetric);CHKERRQ(ierr); 79483301b35fSStefano Zampini } 79493301b35fSStefano Zampini if (pc->pmat->hermitian_set) { 79503301b35fSStefano Zampini ierr = MatSetOption(coarse_mat,MAT_HERMITIAN,pc->pmat->hermitian);CHKERRQ(ierr); 79513301b35fSStefano Zampini } 79523301b35fSStefano Zampini if (pc->pmat->spd_set) { 79533301b35fSStefano Zampini ierr = MatSetOption(coarse_mat,MAT_SPD,pc->pmat->spd);CHKERRQ(ierr); 79543301b35fSStefano Zampini } 795527b6a85dSStefano Zampini if (pcbddc->benign_saddle_point && !pcbddc->benign_have_null) { 795627b6a85dSStefano Zampini ierr = MatSetOption(coarse_mat,MAT_SPD,PETSC_TRUE);CHKERRQ(ierr); 795727b6a85dSStefano Zampini } 79586e683305SStefano Zampini /* set operators */ 79595f76c7aeSStefano Zampini ierr = KSPSetOperators(pcbddc->coarse_ksp,coarse_mat,coarse_mat);CHKERRQ(ierr); 79606e683305SStefano Zampini if (pcbddc->dbg_flag) { 79616e683305SStefano Zampini ierr = PetscViewerASCIISubtractTab(dbg_viewer,2*pcbddc->current_level);CHKERRQ(ierr); 
79626e683305SStefano Zampini } 79636e683305SStefano Zampini } 79641e0482f5SStefano Zampini ierr = MatDestroy(&coarseG);CHKERRQ(ierr); 79656e683305SStefano Zampini ierr = PetscFree(isarray);CHKERRQ(ierr); 7966b1ecc7b1SStefano Zampini #if 0 7967b9b85e73SStefano Zampini { 7968b9b85e73SStefano Zampini PetscViewer viewer; 7969b9b85e73SStefano Zampini char filename[256]; 7970b1ecc7b1SStefano Zampini sprintf(filename,"coarse_mat_level%d.m",pcbddc->current_level); 7971b1ecc7b1SStefano Zampini ierr = PetscViewerASCIIOpen(PetscObjectComm((PetscObject)coarse_mat),filename,&viewer);CHKERRQ(ierr); 79726a9046bcSBarry Smith ierr = PetscViewerPushFormat(viewer,PETSC_VIEWER_ASCII_MATLAB);CHKERRQ(ierr); 7973b9b85e73SStefano Zampini ierr = MatView(coarse_mat,viewer);CHKERRQ(ierr); 7974f159cad9SBarry Smith ierr = PetscViewerPopFormat(viewer);CHKERRQ(ierr); 7975b9b85e73SStefano Zampini ierr = PetscViewerDestroy(&viewer);CHKERRQ(ierr); 7976b9b85e73SStefano Zampini } 7977b9b85e73SStefano Zampini #endif 7978f9eb5b7dSStefano Zampini 797998a51de6SStefano Zampini if (pcbddc->coarse_ksp) { 798098a51de6SStefano Zampini Vec crhs,csol; 798104708bb6SStefano Zampini 7982f347579bSStefano Zampini ierr = KSPGetSolution(pcbddc->coarse_ksp,&csol);CHKERRQ(ierr); 7983f347579bSStefano Zampini ierr = KSPGetRhs(pcbddc->coarse_ksp,&crhs);CHKERRQ(ierr); 7984f347579bSStefano Zampini if (!csol) { 79852a7a6963SBarry Smith ierr = MatCreateVecs(coarse_mat,&((pcbddc->coarse_ksp)->vec_sol),NULL);CHKERRQ(ierr); 7986f9eb5b7dSStefano Zampini } 7987f347579bSStefano Zampini if (!crhs) { 79882a7a6963SBarry Smith ierr = MatCreateVecs(coarse_mat,NULL,&((pcbddc->coarse_ksp)->vec_rhs));CHKERRQ(ierr); 7989f347579bSStefano Zampini } 7990b0f5fe93SStefano Zampini } 79911ae86dd6SStefano Zampini ierr = MatDestroy(&coarsedivudotp);CHKERRQ(ierr); 7992b0f5fe93SStefano Zampini 7993b0f5fe93SStefano Zampini /* compute null space for coarse solver if the benign trick has been requested */ 7994b0f5fe93SStefano Zampini if 
(pcbddc->benign_null) { 7995b0f5fe93SStefano Zampini 7996b0f5fe93SStefano Zampini ierr = VecSet(pcbddc->vec1_P,0.);CHKERRQ(ierr); 79974f1b2e48SStefano Zampini for (i=0;i<pcbddc->benign_n;i++) { 79984f1b2e48SStefano Zampini ierr = VecSetValue(pcbddc->vec1_P,pcbddc->local_primal_size-pcbddc->benign_n+i,1.0,INSERT_VALUES);CHKERRQ(ierr); 79994f1b2e48SStefano Zampini } 8000b0f5fe93SStefano Zampini ierr = VecAssemblyBegin(pcbddc->vec1_P);CHKERRQ(ierr); 8001b0f5fe93SStefano Zampini ierr = VecAssemblyEnd(pcbddc->vec1_P);CHKERRQ(ierr); 8002b0f5fe93SStefano Zampini ierr = VecScatterBegin(pcbddc->coarse_loc_to_glob,pcbddc->vec1_P,pcbddc->coarse_vec,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 8003b0f5fe93SStefano Zampini ierr = VecScatterEnd(pcbddc->coarse_loc_to_glob,pcbddc->vec1_P,pcbddc->coarse_vec,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 8004b0f5fe93SStefano Zampini if (coarse_mat) { 8005b0f5fe93SStefano Zampini Vec nullv; 8006b0f5fe93SStefano Zampini PetscScalar *array,*array2; 8007b0f5fe93SStefano Zampini PetscInt nl; 8008b0f5fe93SStefano Zampini 8009b0f5fe93SStefano Zampini ierr = MatCreateVecs(coarse_mat,&nullv,NULL);CHKERRQ(ierr); 8010b0f5fe93SStefano Zampini ierr = VecGetLocalSize(nullv,&nl);CHKERRQ(ierr); 8011b0f5fe93SStefano Zampini ierr = VecGetArrayRead(pcbddc->coarse_vec,(const PetscScalar**)&array);CHKERRQ(ierr); 8012b0f5fe93SStefano Zampini ierr = VecGetArray(nullv,&array2);CHKERRQ(ierr); 8013b0f5fe93SStefano Zampini ierr = PetscMemcpy(array2,array,nl*sizeof(*array));CHKERRQ(ierr); 8014b0f5fe93SStefano Zampini ierr = VecRestoreArray(nullv,&array2);CHKERRQ(ierr); 8015b0f5fe93SStefano Zampini ierr = VecRestoreArrayRead(pcbddc->coarse_vec,(const PetscScalar**)&array);CHKERRQ(ierr); 8016b0f5fe93SStefano Zampini ierr = VecNormalize(nullv,NULL);CHKERRQ(ierr); 8017b0f5fe93SStefano Zampini ierr = MatNullSpaceCreate(PetscObjectComm((PetscObject)coarse_mat),PETSC_FALSE,1,&nullv,&CoarseNullSpace);CHKERRQ(ierr); 8018b0f5fe93SStefano Zampini ierr = 
VecDestroy(&nullv);CHKERRQ(ierr); 8019b0f5fe93SStefano Zampini } 8020b0f5fe93SStefano Zampini } 8021b0f5fe93SStefano Zampini 8022b0f5fe93SStefano Zampini if (pcbddc->coarse_ksp) { 8023b0f5fe93SStefano Zampini PetscBool ispreonly; 8024b0f5fe93SStefano Zampini 8025b0f5fe93SStefano Zampini if (CoarseNullSpace) { 8026b0f5fe93SStefano Zampini PetscBool isnull; 8027b0f5fe93SStefano Zampini ierr = MatNullSpaceTest(CoarseNullSpace,coarse_mat,&isnull);CHKERRQ(ierr); 8028bef83e63SStefano Zampini if (isnull) { 8029b0f5fe93SStefano Zampini ierr = MatSetNullSpace(coarse_mat,CoarseNullSpace);CHKERRQ(ierr); 8030b0f5fe93SStefano Zampini } 8031bef83e63SStefano Zampini /* TODO: add local nullspaces (if any) */ 8032b0f5fe93SStefano Zampini } 8033b0f5fe93SStefano Zampini /* setup coarse ksp */ 8034b0f5fe93SStefano Zampini ierr = KSPSetUp(pcbddc->coarse_ksp);CHKERRQ(ierr); 8035cbcc2c2aSStefano Zampini /* Check coarse problem if in debug mode or if solving with an iterative method */ 8036cbcc2c2aSStefano Zampini ierr = PetscObjectTypeCompare((PetscObject)pcbddc->coarse_ksp,KSPPREONLY,&ispreonly);CHKERRQ(ierr); 80376e683305SStefano Zampini if (pcbddc->dbg_flag || (!ispreonly && pcbddc->use_coarse_estimates) ) { 8038c8587f34SStefano Zampini KSP check_ksp; 80392b510759SStefano Zampini KSPType check_ksp_type; 8040c8587f34SStefano Zampini PC check_pc; 80416e683305SStefano Zampini Vec check_vec,coarse_vec; 80426a1308c2SStefano Zampini PetscReal abs_infty_error,infty_error,lambda_min=1.0,lambda_max=1.0; 80432b510759SStefano Zampini PetscInt its; 80446e683305SStefano Zampini PetscBool compute_eigs; 80456e683305SStefano Zampini PetscReal *eigs_r,*eigs_c; 80466e683305SStefano Zampini PetscInt neigs; 80478e185a42SStefano Zampini const char *prefix; 8048c8587f34SStefano Zampini 80492b510759SStefano Zampini /* Create ksp object suitable for estimation of extreme eigenvalues */ 80506e683305SStefano Zampini ierr = KSPCreate(PetscObjectComm((PetscObject)pcbddc->coarse_ksp),&check_ksp);CHKERRQ(ierr); 
8051422a814eSBarry Smith ierr = KSPSetErrorIfNotConverged(pcbddc->coarse_ksp,pc->erroriffailure);CHKERRQ(ierr); 805223ee1639SBarry Smith ierr = KSPSetOperators(check_ksp,coarse_mat,coarse_mat);CHKERRQ(ierr); 8053f4ddd8eeSStefano Zampini ierr = KSPSetTolerances(check_ksp,1.e-12,1.e-12,PETSC_DEFAULT,pcbddc->coarse_size);CHKERRQ(ierr); 8054e4d548c7SStefano Zampini /* prevent from setup unneeded object */ 8055e4d548c7SStefano Zampini ierr = KSPGetPC(check_ksp,&check_pc);CHKERRQ(ierr); 8056e4d548c7SStefano Zampini ierr = PCSetType(check_pc,PCNONE);CHKERRQ(ierr); 80572b510759SStefano Zampini if (ispreonly) { 80582b510759SStefano Zampini check_ksp_type = KSPPREONLY; 80596e683305SStefano Zampini compute_eigs = PETSC_FALSE; 80602b510759SStefano Zampini } else { 8061cbcc2c2aSStefano Zampini check_ksp_type = KSPGMRES; 80626e683305SStefano Zampini compute_eigs = PETSC_TRUE; 8063c8587f34SStefano Zampini } 8064c8587f34SStefano Zampini ierr = KSPSetType(check_ksp,check_ksp_type);CHKERRQ(ierr); 80656e683305SStefano Zampini ierr = KSPSetComputeSingularValues(check_ksp,compute_eigs);CHKERRQ(ierr); 80666e683305SStefano Zampini ierr = KSPSetComputeEigenvalues(check_ksp,compute_eigs);CHKERRQ(ierr); 80676e683305SStefano Zampini ierr = KSPGMRESSetRestart(check_ksp,pcbddc->coarse_size+1);CHKERRQ(ierr); 8068a7dc3881SStefano Zampini ierr = KSPGetOptionsPrefix(pcbddc->coarse_ksp,&prefix);CHKERRQ(ierr); 8069a7dc3881SStefano Zampini ierr = KSPSetOptionsPrefix(check_ksp,prefix);CHKERRQ(ierr); 8070a7dc3881SStefano Zampini ierr = KSPAppendOptionsPrefix(check_ksp,"check_");CHKERRQ(ierr); 8071a7dc3881SStefano Zampini ierr = KSPSetFromOptions(check_ksp);CHKERRQ(ierr); 8072c8587f34SStefano Zampini ierr = KSPSetUp(check_ksp);CHKERRQ(ierr); 8073c8587f34SStefano Zampini ierr = KSPGetPC(pcbddc->coarse_ksp,&check_pc);CHKERRQ(ierr); 8074c8587f34SStefano Zampini ierr = KSPSetPC(check_ksp,check_pc);CHKERRQ(ierr); 8075c8587f34SStefano Zampini /* create random vec */ 80762701bc32SStefano Zampini ierr = 
MatCreateVecs(coarse_mat,&coarse_vec,&check_vec);CHKERRQ(ierr); 8077c8587f34SStefano Zampini ierr = VecSetRandom(check_vec,NULL);CHKERRQ(ierr); 80786e683305SStefano Zampini ierr = MatMult(coarse_mat,check_vec,coarse_vec);CHKERRQ(ierr); 8079c8587f34SStefano Zampini /* solve coarse problem */ 80806e683305SStefano Zampini ierr = KSPSolve(check_ksp,coarse_vec,coarse_vec);CHKERRQ(ierr); 8081cbcc2c2aSStefano Zampini /* set eigenvalue estimation if preonly has not been requested */ 80826e683305SStefano Zampini if (compute_eigs) { 8083854ce69bSBarry Smith ierr = PetscMalloc1(pcbddc->coarse_size+1,&eigs_r);CHKERRQ(ierr); 8084854ce69bSBarry Smith ierr = PetscMalloc1(pcbddc->coarse_size+1,&eigs_c);CHKERRQ(ierr); 80856e683305SStefano Zampini ierr = KSPComputeEigenvalues(check_ksp,pcbddc->coarse_size+1,eigs_r,eigs_c,&neigs);CHKERRQ(ierr); 80861ae86dd6SStefano Zampini if (neigs) { 80876e683305SStefano Zampini lambda_max = eigs_r[neigs-1]; 80886e683305SStefano Zampini lambda_min = eigs_r[0]; 80896e683305SStefano Zampini if (pcbddc->use_coarse_estimates) { 80902701bc32SStefano Zampini if (lambda_max>=lambda_min) { /* using PETSC_SMALL since lambda_max == lambda_min is not allowed by KSPChebyshevSetEigenvalues */ 80912701bc32SStefano Zampini ierr = KSPChebyshevSetEigenvalues(pcbddc->coarse_ksp,lambda_max+PETSC_SMALL,lambda_min);CHKERRQ(ierr); 8092cbcc2c2aSStefano Zampini ierr = KSPRichardsonSetScale(pcbddc->coarse_ksp,2.0/(lambda_max+lambda_min));CHKERRQ(ierr); 8093cbcc2c2aSStefano Zampini } 8094c8587f34SStefano Zampini } 8095c8587f34SStefano Zampini } 80961ae86dd6SStefano Zampini } 8097cbcc2c2aSStefano Zampini 8098c8587f34SStefano Zampini /* check coarse problem residual error */ 80996e683305SStefano Zampini if (pcbddc->dbg_flag) { 81006e683305SStefano Zampini PetscViewer dbg_viewer = PETSC_VIEWER_STDOUT_(PetscObjectComm((PetscObject)pcbddc->coarse_ksp)); 81016e683305SStefano Zampini ierr = PetscViewerASCIIAddTab(dbg_viewer,2*(pcbddc->current_level+1));CHKERRQ(ierr); 
81026e683305SStefano Zampini ierr = VecAXPY(check_vec,-1.0,coarse_vec);CHKERRQ(ierr); 8103c8587f34SStefano Zampini ierr = VecNorm(check_vec,NORM_INFINITY,&infty_error);CHKERRQ(ierr); 81046e683305SStefano Zampini ierr = MatMult(coarse_mat,check_vec,coarse_vec);CHKERRQ(ierr); 81056e683305SStefano Zampini ierr = VecNorm(coarse_vec,NORM_INFINITY,&abs_infty_error);CHKERRQ(ierr); 8106779c1cceSStefano Zampini ierr = PetscViewerASCIIPrintf(dbg_viewer,"Coarse problem details (use estimates %d)\n",pcbddc->use_coarse_estimates);CHKERRQ(ierr); 81076e683305SStefano Zampini ierr = PetscObjectPrintClassNamePrefixType((PetscObject)(pcbddc->coarse_ksp),dbg_viewer);CHKERRQ(ierr); 81086e683305SStefano Zampini ierr = PetscObjectPrintClassNamePrefixType((PetscObject)(check_pc),dbg_viewer);CHKERRQ(ierr); 81096e683305SStefano Zampini ierr = PetscViewerASCIIPrintf(dbg_viewer,"Coarse problem exact infty_error : %1.6e\n",infty_error);CHKERRQ(ierr); 81106e683305SStefano Zampini ierr = PetscViewerASCIIPrintf(dbg_viewer,"Coarse problem residual infty_error: %1.6e\n",abs_infty_error);CHKERRQ(ierr); 8111b0f5fe93SStefano Zampini if (CoarseNullSpace) { 8112b0f5fe93SStefano Zampini ierr = PetscViewerASCIIPrintf(dbg_viewer,"Coarse problem is singular\n");CHKERRQ(ierr); 8113b0f5fe93SStefano Zampini } 81146e683305SStefano Zampini if (compute_eigs) { 81156e683305SStefano Zampini PetscReal lambda_max_s,lambda_min_s; 8116b03ebc13SStefano Zampini KSPConvergedReason reason; 8117deec49d1SStefano Zampini ierr = KSPGetType(check_ksp,&check_ksp_type);CHKERRQ(ierr); 8118c8587f34SStefano Zampini ierr = KSPGetIterationNumber(check_ksp,&its);CHKERRQ(ierr); 8119b03ebc13SStefano Zampini ierr = KSPGetConvergedReason(check_ksp,&reason);CHKERRQ(ierr); 81206e683305SStefano Zampini ierr = KSPComputeExtremeSingularValues(check_ksp,&lambda_max_s,&lambda_min_s);CHKERRQ(ierr); 8121b03ebc13SStefano Zampini ierr = PetscViewerASCIIPrintf(dbg_viewer,"Coarse problem eigenvalues (estimated with %d iterations of %s, conv reason 
%d): %1.6e %1.6e (%1.6e %1.6e)\n",its,check_ksp_type,reason,lambda_min,lambda_max,lambda_min_s,lambda_max_s);CHKERRQ(ierr); 81226e683305SStefano Zampini for (i=0;i<neigs;i++) { 81236e683305SStefano Zampini ierr = PetscViewerASCIIPrintf(dbg_viewer,"%1.6e %1.6ei\n",eigs_r[i],eigs_c[i]);CHKERRQ(ierr); 8124c8587f34SStefano Zampini } 81256e683305SStefano Zampini } 81266e683305SStefano Zampini ierr = PetscViewerFlush(dbg_viewer);CHKERRQ(ierr); 81276e683305SStefano Zampini ierr = PetscViewerASCIISubtractTab(dbg_viewer,2*(pcbddc->current_level+1));CHKERRQ(ierr); 81286e683305SStefano Zampini } 8129e4d548c7SStefano Zampini ierr = VecDestroy(&check_vec);CHKERRQ(ierr); 81302701bc32SStefano Zampini ierr = VecDestroy(&coarse_vec);CHKERRQ(ierr); 8131c8587f34SStefano Zampini ierr = KSPDestroy(&check_ksp);CHKERRQ(ierr); 81326e683305SStefano Zampini if (compute_eigs) { 81336e683305SStefano Zampini ierr = PetscFree(eigs_r);CHKERRQ(ierr); 81346e683305SStefano Zampini ierr = PetscFree(eigs_c);CHKERRQ(ierr); 8135c8587f34SStefano Zampini } 81366e683305SStefano Zampini } 81376e683305SStefano Zampini } 8138bef83e63SStefano Zampini ierr = MatNullSpaceDestroy(&CoarseNullSpace);CHKERRQ(ierr); 8139cbcc2c2aSStefano Zampini /* print additional info */ 8140cbcc2c2aSStefano Zampini if (pcbddc->dbg_flag) { 81416e683305SStefano Zampini /* waits until all processes reaches this point */ 81426e683305SStefano Zampini ierr = PetscBarrier((PetscObject)pc);CHKERRQ(ierr); 8143cbcc2c2aSStefano Zampini ierr = PetscViewerASCIIPrintf(pcbddc->dbg_viewer,"Coarse solver setup completed at level %d\n",pcbddc->current_level);CHKERRQ(ierr); 8144cbcc2c2aSStefano Zampini ierr = PetscViewerFlush(pcbddc->dbg_viewer);CHKERRQ(ierr); 8145cbcc2c2aSStefano Zampini } 8146cbcc2c2aSStefano Zampini 81472b510759SStefano Zampini /* free memory */ 8148fdc635d7SStefano Zampini ierr = MatDestroy(&coarse_mat);CHKERRQ(ierr); 8149c8587f34SStefano Zampini PetscFunctionReturn(0); 8150c8587f34SStefano Zampini } 8151674ae819SStefano Zampini 
8152f34684f1SStefano Zampini PetscErrorCode PCBDDCComputePrimalNumbering(PC pc,PetscInt* coarse_size_n,PetscInt** local_primal_indices_n) 8153f34684f1SStefano Zampini { 8154f34684f1SStefano Zampini PC_BDDC* pcbddc = (PC_BDDC*)pc->data; 8155f34684f1SStefano Zampini PC_IS* pcis = (PC_IS*)pc->data; 8156f34684f1SStefano Zampini Mat_IS* matis = (Mat_IS*)pc->pmat->data; 8157dc456d91SStefano Zampini IS subset,subset_mult,subset_n; 8158dc456d91SStefano Zampini PetscInt local_size,coarse_size=0; 815973be2a3aSStefano Zampini PetscInt *local_primal_indices=NULL; 8160dc456d91SStefano Zampini const PetscInt *t_local_primal_indices; 8161f34684f1SStefano Zampini PetscErrorCode ierr; 8162f34684f1SStefano Zampini 8163f34684f1SStefano Zampini PetscFunctionBegin; 8164f34684f1SStefano Zampini /* Compute global number of coarse dofs */ 81656c4ed002SBarry Smith if (pcbddc->local_primal_size && !pcbddc->local_primal_ref_node) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"BDDC ConstraintsSetUp should be called first"); 8166dc456d91SStefano Zampini ierr = ISCreateGeneral(PetscObjectComm((PetscObject)(pc->pmat)),pcbddc->local_primal_size_cc,pcbddc->local_primal_ref_node,PETSC_COPY_VALUES,&subset_n);CHKERRQ(ierr); 81673bbff08aSStefano Zampini ierr = ISLocalToGlobalMappingApplyIS(pcis->mapping,subset_n,&subset);CHKERRQ(ierr); 8168dc456d91SStefano Zampini ierr = ISDestroy(&subset_n);CHKERRQ(ierr); 8169dc456d91SStefano Zampini ierr = ISCreateGeneral(PetscObjectComm((PetscObject)(pc->pmat)),pcbddc->local_primal_size_cc,pcbddc->local_primal_ref_mult,PETSC_COPY_VALUES,&subset_mult);CHKERRQ(ierr); 81706583bcc1SStefano Zampini ierr = ISRenumber(subset,subset_mult,&coarse_size,&subset_n);CHKERRQ(ierr); 8171dc456d91SStefano Zampini ierr = ISDestroy(&subset);CHKERRQ(ierr); 8172dc456d91SStefano Zampini ierr = ISDestroy(&subset_mult);CHKERRQ(ierr); 8173dc456d91SStefano Zampini ierr = ISGetLocalSize(subset_n,&local_size);CHKERRQ(ierr); 81746c4ed002SBarry Smith if (local_size != pcbddc->local_primal_size) 
SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Invalid number of local primal indices computed %D != %D",local_size,pcbddc->local_primal_size); 8175dc456d91SStefano Zampini ierr = PetscMalloc1(local_size,&local_primal_indices);CHKERRQ(ierr); 8176dc456d91SStefano Zampini ierr = ISGetIndices(subset_n,&t_local_primal_indices);CHKERRQ(ierr); 8177dc456d91SStefano Zampini ierr = PetscMemcpy(local_primal_indices,t_local_primal_indices,local_size*sizeof(PetscInt));CHKERRQ(ierr); 8178dc456d91SStefano Zampini ierr = ISRestoreIndices(subset_n,&t_local_primal_indices);CHKERRQ(ierr); 8179dc456d91SStefano Zampini ierr = ISDestroy(&subset_n);CHKERRQ(ierr); 8180f34684f1SStefano Zampini 8181f34684f1SStefano Zampini /* check numbering */ 8182f34684f1SStefano Zampini if (pcbddc->dbg_flag) { 8183019a44ceSStefano Zampini PetscScalar coarsesum,*array,*array2; 8184dc456d91SStefano Zampini PetscInt i; 8185b9b85e73SStefano Zampini PetscBool set_error = PETSC_FALSE,set_error_reduced = PETSC_FALSE; 8186f34684f1SStefano Zampini 8187f34684f1SStefano Zampini ierr = PetscViewerFlush(pcbddc->dbg_viewer);CHKERRQ(ierr); 8188f34684f1SStefano Zampini ierr = PetscViewerASCIIPrintf(pcbddc->dbg_viewer,"--------------------------------------------------\n");CHKERRQ(ierr); 8189f34684f1SStefano Zampini ierr = PetscViewerASCIIPrintf(pcbddc->dbg_viewer,"Check coarse indices\n");CHKERRQ(ierr); 81901575c14dSBarry Smith ierr = PetscViewerASCIIPushSynchronized(pcbddc->dbg_viewer);CHKERRQ(ierr); 8191019a44ceSStefano Zampini /* counter */ 8192019a44ceSStefano Zampini ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr); 8193019a44ceSStefano Zampini ierr = VecSet(pcis->vec1_N,1.0);CHKERRQ(ierr); 8194019a44ceSStefano Zampini ierr = VecScatterBegin(matis->rctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 8195019a44ceSStefano Zampini ierr = VecScatterEnd(matis->rctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 8196019a44ceSStefano Zampini ierr = 
VecScatterBegin(matis->rctx,pcis->vec1_global,pcis->vec2_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 8197019a44ceSStefano Zampini ierr = VecScatterEnd(matis->rctx,pcis->vec1_global,pcis->vec2_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 8198f34684f1SStefano Zampini ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr); 8199f34684f1SStefano Zampini for (i=0;i<pcbddc->local_primal_size;i++) { 8200727cdba6SStefano Zampini ierr = VecSetValue(pcis->vec1_N,pcbddc->primal_indices_local_idxs[i],1.0,INSERT_VALUES);CHKERRQ(ierr); 8201f34684f1SStefano Zampini } 8202f34684f1SStefano Zampini ierr = VecAssemblyBegin(pcis->vec1_N);CHKERRQ(ierr); 8203f34684f1SStefano Zampini ierr = VecAssemblyEnd(pcis->vec1_N);CHKERRQ(ierr); 8204f34684f1SStefano Zampini ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr); 8205e176bc59SStefano Zampini ierr = VecScatterBegin(matis->rctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 8206e176bc59SStefano Zampini ierr = VecScatterEnd(matis->rctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 8207e176bc59SStefano Zampini ierr = VecScatterBegin(matis->rctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 8208e176bc59SStefano Zampini ierr = VecScatterEnd(matis->rctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 8209f34684f1SStefano Zampini ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 8210019a44ceSStefano Zampini ierr = VecGetArray(pcis->vec2_N,&array2);CHKERRQ(ierr); 8211f34684f1SStefano Zampini for (i=0;i<pcis->n;i++) { 8212019a44ceSStefano Zampini if (array[i] != 0.0 && array[i] != array2[i]) { 82132c66d082SStefano Zampini PetscInt owned = (PetscInt)PetscRealPart(array[i]),gi; 821475c01103SStefano Zampini PetscInt neigh = (PetscInt)PetscRealPart(array2[i]); 8215b9b85e73SStefano Zampini set_error = PETSC_TRUE; 82162c66d082SStefano Zampini ierr = ISLocalToGlobalMappingApply(pcis->mapping,1,&i,&gi);CHKERRQ(ierr); 82172c66d082SStefano 
Zampini ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"Subdomain %04d: local index %d (gid %d) owned by %d processes instead of %d!\n",PetscGlobalRank,i,gi,owned,neigh);CHKERRQ(ierr); 8218f34684f1SStefano Zampini } 8219f34684f1SStefano Zampini } 8220019a44ceSStefano Zampini ierr = VecRestoreArray(pcis->vec2_N,&array2);CHKERRQ(ierr); 8221b2566f29SBarry Smith ierr = MPIU_Allreduce(&set_error,&set_error_reduced,1,MPIU_BOOL,MPI_LOR,PetscObjectComm((PetscObject)pc));CHKERRQ(ierr); 8222f34684f1SStefano Zampini ierr = PetscViewerFlush(pcbddc->dbg_viewer);CHKERRQ(ierr); 8223f34684f1SStefano Zampini for (i=0;i<pcis->n;i++) { 8224f34684f1SStefano Zampini if (PetscRealPart(array[i]) > 0.0) array[i] = 1.0/PetscRealPart(array[i]); 8225f34684f1SStefano Zampini } 8226f34684f1SStefano Zampini ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 8227f34684f1SStefano Zampini ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr); 8228e176bc59SStefano Zampini ierr = VecScatterBegin(matis->rctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 8229e176bc59SStefano Zampini ierr = VecScatterEnd(matis->rctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 8230f34684f1SStefano Zampini ierr = VecSum(pcis->vec1_global,&coarsesum);CHKERRQ(ierr); 8231f34684f1SStefano Zampini ierr = PetscViewerASCIIPrintf(pcbddc->dbg_viewer,"Size of coarse problem is %d (%lf)\n",coarse_size,PetscRealPart(coarsesum));CHKERRQ(ierr); 8232b9b85e73SStefano Zampini if (pcbddc->dbg_flag > 1 || set_error_reduced) { 8233ca8b9ea9SStefano Zampini PetscInt *gidxs; 8234ca8b9ea9SStefano Zampini 8235ca8b9ea9SStefano Zampini ierr = PetscMalloc1(pcbddc->local_primal_size,&gidxs);CHKERRQ(ierr); 82363bbff08aSStefano Zampini ierr = ISLocalToGlobalMappingApply(pcis->mapping,pcbddc->local_primal_size,pcbddc->primal_indices_local_idxs,gidxs);CHKERRQ(ierr); 8237f34684f1SStefano Zampini ierr = PetscViewerASCIIPrintf(pcbddc->dbg_viewer,"Distribution of local primal 
indices\n");CHKERRQ(ierr); 8238f34684f1SStefano Zampini ierr = PetscViewerFlush(pcbddc->dbg_viewer);CHKERRQ(ierr); 8239f34684f1SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"Subdomain %04d\n",PetscGlobalRank);CHKERRQ(ierr); 8240f34684f1SStefano Zampini for (i=0;i<pcbddc->local_primal_size;i++) { 82414bc2dc4bSStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"local_primal_indices[%d]=%d (%d,%d)\n",i,local_primal_indices[i],pcbddc->primal_indices_local_idxs[i],gidxs[i]);CHKERRQ(ierr); 8242f34684f1SStefano Zampini } 8243f34684f1SStefano Zampini ierr = PetscViewerFlush(pcbddc->dbg_viewer);CHKERRQ(ierr); 8244ca8b9ea9SStefano Zampini ierr = PetscFree(gidxs);CHKERRQ(ierr); 8245f34684f1SStefano Zampini } 8246f34684f1SStefano Zampini ierr = PetscViewerFlush(pcbddc->dbg_viewer);CHKERRQ(ierr); 82471575c14dSBarry Smith ierr = PetscViewerASCIIPushSynchronized(pcbddc->dbg_viewer);CHKERRQ(ierr); 8248302440fdSBarry Smith if (set_error_reduced) SETERRQ(PetscObjectComm((PetscObject)pc),PETSC_ERR_PLIB,"BDDC Numbering of coarse dofs failed"); 8249f34684f1SStefano Zampini } 82508bec7fa6SStefano Zampini /* ierr = PetscPrintf(PetscObjectComm((PetscObject)pc),"Size of coarse problem is %d\n",coarse_size);CHKERRQ(ierr); */ 8251f34684f1SStefano Zampini /* get back data */ 8252f34684f1SStefano Zampini *coarse_size_n = coarse_size; 8253f34684f1SStefano Zampini *local_primal_indices_n = local_primal_indices; 8254674ae819SStefano Zampini PetscFunctionReturn(0); 8255674ae819SStefano Zampini } 8256674ae819SStefano Zampini 8257a7dc3881SStefano Zampini PetscErrorCode PCBDDCGlobalToLocal(VecScatter g2l_ctx,Vec gwork, Vec lwork, IS globalis, IS* localis) 8258e456f2a8SStefano Zampini { 8259e456f2a8SStefano Zampini IS localis_t; 8260a7dc3881SStefano Zampini PetscInt i,lsize,*idxs,n; 8261e456f2a8SStefano Zampini PetscScalar *vals; 8262e456f2a8SStefano Zampini PetscErrorCode ierr; 8263e456f2a8SStefano Zampini 8264e456f2a8SStefano Zampini 
PetscFunctionBegin; 8265a7dc3881SStefano Zampini /* get indices in local ordering exploiting local to global map */ 8266e456f2a8SStefano Zampini ierr = ISGetLocalSize(globalis,&lsize);CHKERRQ(ierr); 8267854ce69bSBarry Smith ierr = PetscMalloc1(lsize,&vals);CHKERRQ(ierr); 8268e456f2a8SStefano Zampini for (i=0;i<lsize;i++) vals[i] = 1.0; 8269e456f2a8SStefano Zampini ierr = ISGetIndices(globalis,(const PetscInt**)&idxs);CHKERRQ(ierr); 8270a7dc3881SStefano Zampini ierr = VecSet(gwork,0.0);CHKERRQ(ierr); 8271a7dc3881SStefano Zampini ierr = VecSet(lwork,0.0);CHKERRQ(ierr); 82721035eff8SStefano Zampini if (idxs) { /* multilevel guard */ 8273a7dc3881SStefano Zampini ierr = VecSetValues(gwork,lsize,idxs,vals,INSERT_VALUES);CHKERRQ(ierr); 82741035eff8SStefano Zampini } 8275a7dc3881SStefano Zampini ierr = VecAssemblyBegin(gwork);CHKERRQ(ierr); 8276e456f2a8SStefano Zampini ierr = ISRestoreIndices(globalis,(const PetscInt**)&idxs);CHKERRQ(ierr); 8277e456f2a8SStefano Zampini ierr = PetscFree(vals);CHKERRQ(ierr); 8278a7dc3881SStefano Zampini ierr = VecAssemblyEnd(gwork);CHKERRQ(ierr); 8279a7dc3881SStefano Zampini /* now compute set in local ordering */ 8280a7dc3881SStefano Zampini ierr = VecScatterBegin(g2l_ctx,gwork,lwork,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 8281a7dc3881SStefano Zampini ierr = VecScatterEnd(g2l_ctx,gwork,lwork,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 8282a7dc3881SStefano Zampini ierr = VecGetArrayRead(lwork,(const PetscScalar**)&vals);CHKERRQ(ierr); 8283a7dc3881SStefano Zampini ierr = VecGetSize(lwork,&n);CHKERRQ(ierr); 8284a7dc3881SStefano Zampini for (i=0,lsize=0;i<n;i++) { 8285ff92baa0SMatthew G. Knepley if (PetscRealPart(vals[i]) > 0.5) { 8286e456f2a8SStefano Zampini lsize++; 8287e456f2a8SStefano Zampini } 8288e456f2a8SStefano Zampini } 8289854ce69bSBarry Smith ierr = PetscMalloc1(lsize,&idxs);CHKERRQ(ierr); 8290a7dc3881SStefano Zampini for (i=0,lsize=0;i<n;i++) { 8291ff92baa0SMatthew G. 
Knepley if (PetscRealPart(vals[i]) > 0.5) { 8292e456f2a8SStefano Zampini idxs[lsize++] = i; 8293e456f2a8SStefano Zampini } 8294e456f2a8SStefano Zampini } 8295a7dc3881SStefano Zampini ierr = VecRestoreArrayRead(lwork,(const PetscScalar**)&vals);CHKERRQ(ierr); 8296a7dc3881SStefano Zampini ierr = ISCreateGeneral(PetscObjectComm((PetscObject)gwork),lsize,idxs,PETSC_OWN_POINTER,&localis_t);CHKERRQ(ierr); 8297e456f2a8SStefano Zampini *localis = localis_t; 8298e456f2a8SStefano Zampini PetscFunctionReturn(0); 8299e456f2a8SStefano Zampini } 8300906d46d4SStefano Zampini 830108122e43SStefano Zampini PetscErrorCode PCBDDCSetUpSubSchurs(PC pc) 8302b96c3477SStefano Zampini { 8303a64f4aa4SStefano Zampini PC_IS *pcis=(PC_IS*)pc->data; 8304b96c3477SStefano Zampini PC_BDDC *pcbddc=(PC_BDDC*)pc->data; 8305b96c3477SStefano Zampini PCBDDCSubSchurs sub_schurs=pcbddc->sub_schurs; 8306a64f4aa4SStefano Zampini Mat S_j; 8307b96c3477SStefano Zampini PetscInt *used_xadj,*used_adjncy; 8308b96c3477SStefano Zampini PetscBool free_used_adj; 8309b96c3477SStefano Zampini PetscErrorCode ierr; 8310b96c3477SStefano Zampini 8311b96c3477SStefano Zampini PetscFunctionBegin; 8312b96c3477SStefano Zampini /* decide the adjacency to be used for determining internal problems for local schur on subsets */ 8313b96c3477SStefano Zampini free_used_adj = PETSC_FALSE; 831408122e43SStefano Zampini if (pcbddc->sub_schurs_layers == -1) { 8315b96c3477SStefano Zampini used_xadj = NULL; 8316b96c3477SStefano Zampini used_adjncy = NULL; 8317b96c3477SStefano Zampini } else { 831808122e43SStefano Zampini if (pcbddc->sub_schurs_use_useradj && pcbddc->mat_graph->xadj) { 831908122e43SStefano Zampini used_xadj = pcbddc->mat_graph->xadj; 832008122e43SStefano Zampini used_adjncy = pcbddc->mat_graph->adjncy; 832108122e43SStefano Zampini } else if (pcbddc->computed_rowadj) { 8322b96c3477SStefano Zampini used_xadj = pcbddc->mat_graph->xadj; 8323b96c3477SStefano Zampini used_adjncy = pcbddc->mat_graph->adjncy; 8324b96c3477SStefano 
Zampini } else { 83252fffb893SStefano Zampini PetscBool flg_row=PETSC_FALSE; 8326b96c3477SStefano Zampini const PetscInt *xadj,*adjncy; 8327b96c3477SStefano Zampini PetscInt nvtxs; 8328b96c3477SStefano Zampini 83292fffb893SStefano Zampini ierr = MatGetRowIJ(pcbddc->local_mat,0,PETSC_TRUE,PETSC_FALSE,&nvtxs,&xadj,&adjncy,&flg_row);CHKERRQ(ierr); 83302fffb893SStefano Zampini if (flg_row) { 8331b96c3477SStefano Zampini ierr = PetscMalloc2(nvtxs+1,&used_xadj,xadj[nvtxs],&used_adjncy);CHKERRQ(ierr); 8332b96c3477SStefano Zampini ierr = PetscMemcpy(used_xadj,xadj,(nvtxs+1)*sizeof(*xadj));CHKERRQ(ierr); 8333b96c3477SStefano Zampini ierr = PetscMemcpy(used_adjncy,adjncy,(xadj[nvtxs])*sizeof(*adjncy));CHKERRQ(ierr); 8334b96c3477SStefano Zampini free_used_adj = PETSC_TRUE; 83352fffb893SStefano Zampini } else { 83362fffb893SStefano Zampini pcbddc->sub_schurs_layers = -1; 83372fffb893SStefano Zampini used_xadj = NULL; 83382fffb893SStefano Zampini used_adjncy = NULL; 83392fffb893SStefano Zampini } 83402fffb893SStefano Zampini ierr = MatRestoreRowIJ(pcbddc->local_mat,0,PETSC_TRUE,PETSC_FALSE,&nvtxs,&xadj,&adjncy,&flg_row);CHKERRQ(ierr); 8341b96c3477SStefano Zampini } 8342b96c3477SStefano Zampini } 8343d5574798SStefano Zampini 8344d5574798SStefano Zampini /* setup sub_schurs data */ 8345a64f4aa4SStefano Zampini ierr = MatCreateSchurComplement(pcis->A_II,pcis->A_II,pcis->A_IB,pcis->A_BI,pcis->A_BB,&S_j);CHKERRQ(ierr); 8346df4d28bfSStefano Zampini if (!sub_schurs->schur_explicit) { 8347df4d28bfSStefano Zampini /* pcbddc->ksp_D up to date only if not using MatFactor with Schur complement support */ 8348a64f4aa4SStefano Zampini ierr = MatSchurComplementSetKSP(S_j,pcbddc->ksp_D);CHKERRQ(ierr); 834991af6908SStefano Zampini ierr = PCBDDCSubSchursSetUp(sub_schurs,NULL,S_j,PETSC_FALSE,used_xadj,used_adjncy,pcbddc->sub_schurs_layers,NULL,pcbddc->adaptive_selection,PETSC_FALSE,PETSC_FALSE,0,NULL,NULL,NULL,NULL);CHKERRQ(ierr); 8350a64f4aa4SStefano Zampini } else { 835172b8c272SStefano Zampini 
Mat change = NULL; 83529d54b7f4SStefano Zampini Vec scaling = NULL; 8353111315fdSstefano_zampini IS change_primal = NULL, iP; 8354111315fdSstefano_zampini PetscInt benign_n; 8355111315fdSstefano_zampini PetscBool reuse_solvers = (PetscBool)!pcbddc->use_change_of_basis; 8356111315fdSstefano_zampini PetscBool isseqaij,need_change = PETSC_FALSE; 8357111315fdSstefano_zampini PetscBool discrete_harmonic = PETSC_FALSE; 8358a3df083aSStefano Zampini 83595feab87aSStefano Zampini if (!pcbddc->use_vertices && reuse_solvers) { 83605feab87aSStefano Zampini PetscInt n_vertices; 83615feab87aSStefano Zampini 83625feab87aSStefano Zampini ierr = ISGetLocalSize(sub_schurs->is_vertices,&n_vertices);CHKERRQ(ierr); 83632034aafcSStefano Zampini reuse_solvers = (PetscBool)!n_vertices; 83645feab87aSStefano Zampini } 836504708bb6SStefano Zampini ierr = PetscObjectTypeCompare((PetscObject)pcbddc->local_mat,MATSEQAIJ,&isseqaij);CHKERRQ(ierr); 836604708bb6SStefano Zampini if (!isseqaij) { 836704708bb6SStefano Zampini Mat_IS* matis = (Mat_IS*)pc->pmat->data; 836804708bb6SStefano Zampini if (matis->A == pcbddc->local_mat) { 836904708bb6SStefano Zampini ierr = MatDestroy(&pcbddc->local_mat);CHKERRQ(ierr); 837004708bb6SStefano Zampini ierr = MatConvert(matis->A,MATSEQAIJ,MAT_INITIAL_MATRIX,&pcbddc->local_mat);CHKERRQ(ierr); 837104708bb6SStefano Zampini } else { 8372511c6705SHong Zhang ierr = MatConvert(pcbddc->local_mat,MATSEQAIJ,MAT_INPLACE_MATRIX,&pcbddc->local_mat);CHKERRQ(ierr); 837304708bb6SStefano Zampini } 837404708bb6SStefano Zampini } 8375a3df083aSStefano Zampini if (!pcbddc->benign_change_explicit) { 8376a3df083aSStefano Zampini benign_n = pcbddc->benign_n; 8377ca92afb2SStefano Zampini } else { 8378a3df083aSStefano Zampini benign_n = 0; 8379ca92afb2SStefano Zampini } 8380b7ab4a40SStefano Zampini /* sub_schurs->change is a local object; instead, PCBDDCConstraintsSetUp and the quantities used in the test below are logically collective on pc. 
8381b7ab4a40SStefano Zampini We need a global reduction to avoid possible deadlocks. 8382b7ab4a40SStefano Zampini We assume that sub_schurs->change is created once, and then reused for different solves, unless the topography has been recomputed */ 838372b8c272SStefano Zampini if (pcbddc->adaptive_userdefined || (pcbddc->deluxe_zerorows && !pcbddc->use_change_of_basis)) { 838422db5ddcSStefano Zampini PetscBool have_loc_change = (PetscBool)(!!sub_schurs->change); 8385b7ab4a40SStefano Zampini ierr = MPIU_Allreduce(&have_loc_change,&need_change,1,MPIU_BOOL,MPI_LOR,PetscObjectComm((PetscObject)pc));CHKERRQ(ierr); 838622db5ddcSStefano Zampini need_change = (PetscBool)(!need_change); 8387b7ab4a40SStefano Zampini } 8388b7ab4a40SStefano Zampini /* If the user defines additional constraints, we import them here. 8389b7ab4a40SStefano Zampini We need to compute the change of basis according to the quadrature weights attached to pmat via MatSetNearNullSpace, and this could not be done (at the moment) without some hacking */ 8390b7ab4a40SStefano Zampini if (need_change) { 839188c03ad3SStefano Zampini PC_IS *pcisf; 839288c03ad3SStefano Zampini PC_BDDC *pcbddcf; 839388c03ad3SStefano Zampini PC pcf; 839488c03ad3SStefano Zampini 8395e4d548c7SStefano Zampini if (pcbddc->sub_schurs_rebuild) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"Cannot compute change of basis with a different graph"); 839688c03ad3SStefano Zampini ierr = PCCreate(PetscObjectComm((PetscObject)pc),&pcf);CHKERRQ(ierr); 839788c03ad3SStefano Zampini ierr = PCSetOperators(pcf,pc->mat,pc->pmat);CHKERRQ(ierr); 839888c03ad3SStefano Zampini ierr = PCSetType(pcf,PCBDDC);CHKERRQ(ierr); 8399b9be95fcSstefano_zampini 840088c03ad3SStefano Zampini /* hacks */ 840188c03ad3SStefano Zampini pcisf = (PC_IS*)pcf->data; 840272b8c272SStefano Zampini pcisf->is_B_local = pcis->is_B_local; 840372b8c272SStefano Zampini pcisf->vec1_N = pcis->vec1_N; 840472b8c272SStefano Zampini pcisf->BtoNmap = pcis->BtoNmap; 840572b8c272SStefano Zampini pcisf->n 
= pcis->n; 840672b8c272SStefano Zampini pcisf->n_B = pcis->n_B; 840788c03ad3SStefano Zampini pcbddcf = (PC_BDDC*)pcf->data; 840888c03ad3SStefano Zampini ierr = PetscFree(pcbddcf->mat_graph);CHKERRQ(ierr); 840988c03ad3SStefano Zampini pcbddcf->mat_graph = pcbddc->mat_graph; 841088c03ad3SStefano Zampini pcbddcf->use_faces = PETSC_TRUE; 841188c03ad3SStefano Zampini pcbddcf->use_change_of_basis = PETSC_TRUE; 841288c03ad3SStefano Zampini pcbddcf->use_change_on_faces = PETSC_TRUE; 841372b8c272SStefano Zampini pcbddcf->use_qr_single = PETSC_TRUE; 841488c03ad3SStefano Zampini pcbddcf->fake_change = PETSC_TRUE; 8415b9be95fcSstefano_zampini 8416b9be95fcSstefano_zampini /* setup constraints so that we can get information on primal vertices and change of basis (in local numbering) */ 841788c03ad3SStefano Zampini ierr = PCBDDCConstraintsSetUp(pcf);CHKERRQ(ierr); 841872b8c272SStefano Zampini sub_schurs->change_with_qr = pcbddcf->use_qr_single; 841972b8c272SStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,pcbddcf->n_vertices,pcbddcf->local_primal_ref_node,PETSC_COPY_VALUES,&change_primal);CHKERRQ(ierr); 842072b8c272SStefano Zampini change = pcbddcf->ConstraintMatrix; 842172b8c272SStefano Zampini pcbddcf->ConstraintMatrix = NULL; 8422b9be95fcSstefano_zampini 842388c03ad3SStefano Zampini /* free unneeded memory allocated in PCBDDCConstraintsSetUp */ 842472b8c272SStefano Zampini ierr = PetscFree(pcbddcf->sub_schurs);CHKERRQ(ierr); 842588c03ad3SStefano Zampini ierr = MatNullSpaceDestroy(&pcbddcf->onearnullspace);CHKERRQ(ierr); 842688c03ad3SStefano Zampini ierr = PetscFree2(pcbddcf->local_primal_ref_node,pcbddcf->local_primal_ref_mult);CHKERRQ(ierr); 842788c03ad3SStefano Zampini ierr = PetscFree(pcbddcf->primal_indices_local_idxs);CHKERRQ(ierr); 842888c03ad3SStefano Zampini ierr = PetscFree(pcbddcf->onearnullvecs_state);CHKERRQ(ierr); 842988c03ad3SStefano Zampini ierr = PetscFree(pcf->data);CHKERRQ(ierr); 843088c03ad3SStefano Zampini pcf->ops->destroy = NULL; 
8431b9be95fcSstefano_zampini pcf->ops->reset = NULL; 843288c03ad3SStefano Zampini ierr = PCDestroy(&pcf);CHKERRQ(ierr); 843388c03ad3SStefano Zampini } 84349d54b7f4SStefano Zampini if (!pcbddc->use_deluxe_scaling) scaling = pcis->D; 8435111315fdSstefano_zampini 8436111315fdSstefano_zampini ierr = PetscObjectQuery((PetscObject)pc,"__KSPFETIDP_iP",(PetscObject*)&iP);CHKERRQ(ierr); 8437111315fdSstefano_zampini if (iP) { 8438111315fdSstefano_zampini ierr = PetscOptionsBegin(PetscObjectComm((PetscObject)iP),sub_schurs->prefix,"BDDC sub_schurs options","PC");CHKERRQ(ierr); 8439111315fdSstefano_zampini ierr = PetscOptionsBool("-sub_schurs_discrete_harmonic",NULL,NULL,discrete_harmonic,&discrete_harmonic,NULL);CHKERRQ(ierr); 8440111315fdSstefano_zampini ierr = PetscOptionsEnd();CHKERRQ(ierr); 8441111315fdSstefano_zampini } 8442111315fdSstefano_zampini if (discrete_harmonic) { 8443111315fdSstefano_zampini Mat A; 8444111315fdSstefano_zampini ierr = MatDuplicate(pcbddc->local_mat,MAT_COPY_VALUES,&A);CHKERRQ(ierr); 8445111315fdSstefano_zampini ierr = MatZeroRowsColumnsIS(A,iP,1.0,NULL,NULL);CHKERRQ(ierr); 8446111315fdSstefano_zampini ierr = PetscObjectCompose((PetscObject)A,"__KSPFETIDP_iP",(PetscObject)iP);CHKERRQ(ierr); 8447111315fdSstefano_zampini ierr = PCBDDCSubSchursSetUp(sub_schurs,A,S_j,pcbddc->sub_schurs_exact_schur,used_xadj,used_adjncy,pcbddc->sub_schurs_layers,scaling,pcbddc->adaptive_selection,reuse_solvers,pcbddc->benign_saddle_point,benign_n,pcbddc->benign_p0_lidx,pcbddc->benign_zerodiag_subs,change,change_primal);CHKERRQ(ierr); 8448111315fdSstefano_zampini ierr = MatDestroy(&A);CHKERRQ(ierr); 8449111315fdSstefano_zampini } else { 845091af6908SStefano Zampini ierr = 
PCBDDCSubSchursSetUp(sub_schurs,pcbddc->local_mat,S_j,pcbddc->sub_schurs_exact_schur,used_xadj,used_adjncy,pcbddc->sub_schurs_layers,scaling,pcbddc->adaptive_selection,reuse_solvers,pcbddc->benign_saddle_point,benign_n,pcbddc->benign_p0_lidx,pcbddc->benign_zerodiag_subs,change,change_primal);CHKERRQ(ierr); 8451111315fdSstefano_zampini } 845272b8c272SStefano Zampini ierr = MatDestroy(&change);CHKERRQ(ierr); 845372b8c272SStefano Zampini ierr = ISDestroy(&change_primal);CHKERRQ(ierr); 8454ca92afb2SStefano Zampini } 8455d12d3064SStefano Zampini ierr = MatDestroy(&S_j);CHKERRQ(ierr); 8456b96c3477SStefano Zampini 8457b96c3477SStefano Zampini /* free adjacency */ 8458b96c3477SStefano Zampini if (free_used_adj) { 8459b96c3477SStefano Zampini ierr = PetscFree2(used_xadj,used_adjncy);CHKERRQ(ierr); 8460b96c3477SStefano Zampini } 8461b96c3477SStefano Zampini PetscFunctionReturn(0); 8462b96c3477SStefano Zampini } 8463b96c3477SStefano Zampini 846408122e43SStefano Zampini PetscErrorCode PCBDDCInitSubSchurs(PC pc) 8465b96c3477SStefano Zampini { 8466b96c3477SStefano Zampini PC_IS *pcis=(PC_IS*)pc->data; 8467b96c3477SStefano Zampini PC_BDDC *pcbddc=(PC_BDDC*)pc->data; 8468b96c3477SStefano Zampini PCBDDCGraph graph; 8469b96c3477SStefano Zampini PetscErrorCode ierr; 8470b96c3477SStefano Zampini 8471b96c3477SStefano Zampini PetscFunctionBegin; 8472b96c3477SStefano Zampini /* attach interface graph for determining subsets */ 847308122e43SStefano Zampini if (pcbddc->sub_schurs_rebuild) { /* in case rebuild has been requested, it uses a graph generated only by the neighbouring information */ 84743301b35fSStefano Zampini IS verticesIS,verticescomm; 84753301b35fSStefano Zampini PetscInt vsize,*idxs; 8476b96c3477SStefano Zampini 8477b96c3477SStefano Zampini ierr = PCBDDCGraphGetCandidatesIS(pcbddc->mat_graph,NULL,NULL,NULL,NULL,&verticesIS);CHKERRQ(ierr); 84783301b35fSStefano Zampini ierr = ISGetSize(verticesIS,&vsize);CHKERRQ(ierr); 84793301b35fSStefano Zampini ierr = 
ISGetIndices(verticesIS,(const PetscInt**)&idxs);CHKERRQ(ierr); 84803301b35fSStefano Zampini ierr = ISCreateGeneral(PetscObjectComm((PetscObject)pc),vsize,idxs,PETSC_COPY_VALUES,&verticescomm);CHKERRQ(ierr); 84813301b35fSStefano Zampini ierr = ISRestoreIndices(verticesIS,(const PetscInt**)&idxs);CHKERRQ(ierr); 8482c8272957SStefano Zampini ierr = PCBDDCGraphRestoreCandidatesIS(pcbddc->mat_graph,NULL,NULL,NULL,NULL,&verticesIS);CHKERRQ(ierr); 8483b96c3477SStefano Zampini ierr = PCBDDCGraphCreate(&graph);CHKERRQ(ierr); 8484be12c134Sstefano_zampini ierr = PCBDDCGraphInit(graph,pcbddc->mat_graph->l2gmap,pcbddc->mat_graph->nvtxs_global,pcbddc->graphmaxcount);CHKERRQ(ierr); 8485441e0de0SStefano Zampini ierr = PCBDDCGraphSetUp(graph,pcbddc->mat_graph->custom_minimal_size,NULL,pcbddc->DirichletBoundariesLocal,0,NULL,verticescomm);CHKERRQ(ierr); 84863301b35fSStefano Zampini ierr = ISDestroy(&verticescomm);CHKERRQ(ierr); 8487b96c3477SStefano Zampini ierr = PCBDDCGraphComputeConnectedComponents(graph);CHKERRQ(ierr); 8488b96c3477SStefano Zampini } else { 8489b96c3477SStefano Zampini graph = pcbddc->mat_graph; 8490b96c3477SStefano Zampini } 8491e4d548c7SStefano Zampini /* print some info */ 84925c643e28SStefano Zampini if (pcbddc->dbg_flag && !pcbddc->sub_schurs_rebuild) { 8493e4d548c7SStefano Zampini IS vertices; 8494e4d548c7SStefano Zampini PetscInt nv,nedges,nfaces; 8495c8272957SStefano Zampini ierr = PCBDDCGraphASCIIView(graph,pcbddc->dbg_flag,pcbddc->dbg_viewer);CHKERRQ(ierr); 8496e4d548c7SStefano Zampini ierr = PCBDDCGraphGetCandidatesIS(graph,&nfaces,NULL,&nedges,NULL,&vertices);CHKERRQ(ierr); 8497e4d548c7SStefano Zampini ierr = ISGetSize(vertices,&nv);CHKERRQ(ierr); 8498e4d548c7SStefano Zampini ierr = PetscViewerASCIIPushSynchronized(pcbddc->dbg_viewer);CHKERRQ(ierr); 8499e4d548c7SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"--------------------------------------------------------------\n");CHKERRQ(ierr); 8500e4d548c7SStefano Zampini ierr 
= PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"Subdomain %04d got %02d local candidate vertices (%d)\n",PetscGlobalRank,nv,pcbddc->use_vertices);CHKERRQ(ierr); 8501e4d548c7SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"Subdomain %04d got %02d local candidate edges (%d)\n",PetscGlobalRank,nedges,pcbddc->use_edges);CHKERRQ(ierr); 8502e4d548c7SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"Subdomain %04d got %02d local candidate faces (%d)\n",PetscGlobalRank,nfaces,pcbddc->use_faces);CHKERRQ(ierr); 8503e4d548c7SStefano Zampini ierr = PetscViewerFlush(pcbddc->dbg_viewer);CHKERRQ(ierr); 8504e4d548c7SStefano Zampini ierr = PetscViewerASCIIPopSynchronized(pcbddc->dbg_viewer);CHKERRQ(ierr); 8505c8272957SStefano Zampini ierr = PCBDDCGraphRestoreCandidatesIS(graph,&nfaces,NULL,&nedges,NULL,&vertices);CHKERRQ(ierr); 8506e4d548c7SStefano Zampini } 8507b96c3477SStefano Zampini 8508b96c3477SStefano Zampini /* sub_schurs init */ 8509b334f244SStefano Zampini if (!pcbddc->sub_schurs) { 8510b334f244SStefano Zampini ierr = PCBDDCSubSchursCreate(&pcbddc->sub_schurs);CHKERRQ(ierr); 8511b334f244SStefano Zampini } 85128b6046baSStefano Zampini ierr = PCBDDCSubSchursInit(pcbddc->sub_schurs,pcis->is_I_local,pcis->is_B_local,graph,pcis->BtoNmap,pcbddc->sub_schurs_rebuild);CHKERRQ(ierr); 8513e62b6521Sstefano_zampini pcbddc->sub_schurs->prefix = ((PetscObject)pc)->prefix; 8514a64f4aa4SStefano Zampini 8515b96c3477SStefano Zampini /* free graph struct */ 851608122e43SStefano Zampini if (pcbddc->sub_schurs_rebuild) { 8517b96c3477SStefano Zampini ierr = PCBDDCGraphDestroy(&graph);CHKERRQ(ierr); 8518b96c3477SStefano Zampini } 8519b96c3477SStefano Zampini PetscFunctionReturn(0); 8520b96c3477SStefano Zampini } 8521fa34dd3eSStefano Zampini 8522fa34dd3eSStefano Zampini PetscErrorCode PCBDDCCheckOperator(PC pc) 8523fa34dd3eSStefano Zampini { 8524fa34dd3eSStefano Zampini PC_IS *pcis=(PC_IS*)pc->data; 8525fa34dd3eSStefano Zampini 
PC_BDDC *pcbddc=(PC_BDDC*)pc->data; 8526fa34dd3eSStefano Zampini PetscErrorCode ierr; 8527fa34dd3eSStefano Zampini 8528fa34dd3eSStefano Zampini PetscFunctionBegin; 8529fa34dd3eSStefano Zampini if (pcbddc->n_vertices == pcbddc->local_primal_size) { 8530fa34dd3eSStefano Zampini IS zerodiag = NULL; 85314f1b2e48SStefano Zampini Mat S_j,B0_B=NULL; 8532fa34dd3eSStefano Zampini Vec dummy_vec=NULL,vec_check_B,vec_scale_P; 85334f1b2e48SStefano Zampini PetscScalar *p0_check,*array,*array2; 853475c01103SStefano Zampini PetscReal norm; 8535fa34dd3eSStefano Zampini PetscInt i; 8536fa34dd3eSStefano Zampini 8537fa34dd3eSStefano Zampini /* B0 and B0_B */ 8538fa34dd3eSStefano Zampini if (zerodiag) { 8539fa34dd3eSStefano Zampini IS dummy; 8540fa34dd3eSStefano Zampini 85414f1b2e48SStefano Zampini ierr = ISCreateStride(PETSC_COMM_SELF,pcbddc->benign_n,0,1,&dummy);CHKERRQ(ierr); 85427dae84e0SHong Zhang ierr = MatCreateSubMatrix(pcbddc->benign_B0,dummy,pcis->is_B_local,MAT_INITIAL_MATRIX,&B0_B);CHKERRQ(ierr); 8543fa34dd3eSStefano Zampini ierr = MatCreateVecs(B0_B,NULL,&dummy_vec);CHKERRQ(ierr); 8544fa34dd3eSStefano Zampini ierr = ISDestroy(&dummy);CHKERRQ(ierr); 8545fa34dd3eSStefano Zampini } 8546fa34dd3eSStefano Zampini /* I need a primal vector to scale primal nodes since BDDC sums contibutions */ 8547fa34dd3eSStefano Zampini ierr = VecDuplicate(pcbddc->vec1_P,&vec_scale_P);CHKERRQ(ierr); 8548fa34dd3eSStefano Zampini ierr = VecSet(pcbddc->vec1_P,1.0);CHKERRQ(ierr); 8549fa34dd3eSStefano Zampini ierr = VecScatterBegin(pcbddc->coarse_loc_to_glob,pcbddc->vec1_P,pcbddc->coarse_vec,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 8550fa34dd3eSStefano Zampini ierr = VecScatterEnd(pcbddc->coarse_loc_to_glob,pcbddc->vec1_P,pcbddc->coarse_vec,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 8551fa34dd3eSStefano Zampini ierr = VecScatterBegin(pcbddc->coarse_loc_to_glob,pcbddc->coarse_vec,vec_scale_P,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 8552fa34dd3eSStefano Zampini ierr = 
VecScatterEnd(pcbddc->coarse_loc_to_glob,pcbddc->coarse_vec,vec_scale_P,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 8553fa34dd3eSStefano Zampini ierr = VecReciprocal(vec_scale_P);CHKERRQ(ierr); 8554fa34dd3eSStefano Zampini /* S_j */ 8555fa34dd3eSStefano Zampini ierr = MatCreateSchurComplement(pcis->A_II,pcis->A_II,pcis->A_IB,pcis->A_BI,pcis->A_BB,&S_j);CHKERRQ(ierr); 8556fa34dd3eSStefano Zampini ierr = MatSchurComplementSetKSP(S_j,pcbddc->ksp_D);CHKERRQ(ierr); 8557fa34dd3eSStefano Zampini 8558fa34dd3eSStefano Zampini /* mimic vector in \widetilde{W}_\Gamma */ 8559fa34dd3eSStefano Zampini ierr = VecSetRandom(pcis->vec1_N,NULL);CHKERRQ(ierr); 8560fa34dd3eSStefano Zampini /* continuous in primal space */ 8561fa34dd3eSStefano Zampini ierr = VecSetRandom(pcbddc->coarse_vec,NULL);CHKERRQ(ierr); 8562fa34dd3eSStefano Zampini ierr = VecScatterBegin(pcbddc->coarse_loc_to_glob,pcbddc->coarse_vec,pcbddc->vec1_P,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 8563fa34dd3eSStefano Zampini ierr = VecScatterEnd(pcbddc->coarse_loc_to_glob,pcbddc->coarse_vec,pcbddc->vec1_P,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 8564fa34dd3eSStefano Zampini ierr = VecGetArray(pcbddc->vec1_P,&array);CHKERRQ(ierr); 85654f1b2e48SStefano Zampini ierr = PetscCalloc1(pcbddc->benign_n,&p0_check);CHKERRQ(ierr); 85664f1b2e48SStefano Zampini for (i=0;i<pcbddc->benign_n;i++) p0_check[i] = array[pcbddc->local_primal_size-pcbddc->benign_n+i]; 8567fa34dd3eSStefano Zampini ierr = VecSetValues(pcis->vec1_N,pcbddc->local_primal_size,pcbddc->local_primal_ref_node,array,INSERT_VALUES);CHKERRQ(ierr); 8568fa34dd3eSStefano Zampini ierr = VecRestoreArray(pcbddc->vec1_P,&array);CHKERRQ(ierr); 8569fa34dd3eSStefano Zampini ierr = VecAssemblyBegin(pcis->vec1_N);CHKERRQ(ierr); 8570fa34dd3eSStefano Zampini ierr = VecAssemblyEnd(pcis->vec1_N);CHKERRQ(ierr); 8571fa34dd3eSStefano Zampini ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec2_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 8572fa34dd3eSStefano Zampini 
ierr = VecScatterEnd(pcis->N_to_B,pcis->vec1_N,pcis->vec2_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 8573fa34dd3eSStefano Zampini ierr = VecDuplicate(pcis->vec2_B,&vec_check_B);CHKERRQ(ierr); 8574fa34dd3eSStefano Zampini ierr = VecCopy(pcis->vec2_B,vec_check_B);CHKERRQ(ierr); 8575fa34dd3eSStefano Zampini 8576fa34dd3eSStefano Zampini /* assemble rhs for coarse problem */ 8577fa34dd3eSStefano Zampini /* widetilde{S}_\Gamma w_\Gamma + \widetilde{B0}^T_B p0 */ 8578fa34dd3eSStefano Zampini /* local with Schur */ 8579fa34dd3eSStefano Zampini ierr = MatMult(S_j,pcis->vec2_B,pcis->vec1_B);CHKERRQ(ierr); 8580fa34dd3eSStefano Zampini if (zerodiag) { 8581fa34dd3eSStefano Zampini ierr = VecGetArray(dummy_vec,&array);CHKERRQ(ierr); 85824f1b2e48SStefano Zampini for (i=0;i<pcbddc->benign_n;i++) array[i] = p0_check[i]; 8583fa34dd3eSStefano Zampini ierr = VecRestoreArray(dummy_vec,&array);CHKERRQ(ierr); 8584fa34dd3eSStefano Zampini ierr = MatMultTransposeAdd(B0_B,dummy_vec,pcis->vec1_B,pcis->vec1_B);CHKERRQ(ierr); 8585fa34dd3eSStefano Zampini } 8586fa34dd3eSStefano Zampini /* sum on primal nodes the local contributions */ 8587fa34dd3eSStefano Zampini ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_B,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 8588fa34dd3eSStefano Zampini ierr = VecScatterEnd(pcis->N_to_B,pcis->vec1_B,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 8589fa34dd3eSStefano Zampini ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 8590fa34dd3eSStefano Zampini ierr = VecGetArray(pcbddc->vec1_P,&array2);CHKERRQ(ierr); 8591fa34dd3eSStefano Zampini for (i=0;i<pcbddc->local_primal_size;i++) array2[i] = array[pcbddc->local_primal_ref_node[i]]; 8592fa34dd3eSStefano Zampini ierr = VecRestoreArray(pcbddc->vec1_P,&array2);CHKERRQ(ierr); 8593fa34dd3eSStefano Zampini ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 8594fa34dd3eSStefano Zampini ierr = VecSet(pcbddc->coarse_vec,0.);CHKERRQ(ierr); 8595fa34dd3eSStefano Zampini ierr = 
VecScatterBegin(pcbddc->coarse_loc_to_glob,pcbddc->vec1_P,pcbddc->coarse_vec,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 8596fa34dd3eSStefano Zampini ierr = VecScatterEnd(pcbddc->coarse_loc_to_glob,pcbddc->vec1_P,pcbddc->coarse_vec,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 8597fa34dd3eSStefano Zampini ierr = VecScatterBegin(pcbddc->coarse_loc_to_glob,pcbddc->coarse_vec,pcbddc->vec1_P,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 8598fa34dd3eSStefano Zampini ierr = VecScatterEnd(pcbddc->coarse_loc_to_glob,pcbddc->coarse_vec,pcbddc->vec1_P,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 8599fa34dd3eSStefano Zampini ierr = VecGetArray(pcbddc->vec1_P,&array);CHKERRQ(ierr); 8600fa34dd3eSStefano Zampini /* scale primal nodes (BDDC sums contibutions) */ 8601fa34dd3eSStefano Zampini ierr = VecPointwiseMult(pcbddc->vec1_P,vec_scale_P,pcbddc->vec1_P);CHKERRQ(ierr); 8602fa34dd3eSStefano Zampini ierr = VecSetValues(pcis->vec1_N,pcbddc->local_primal_size,pcbddc->local_primal_ref_node,array,INSERT_VALUES);CHKERRQ(ierr); 8603fa34dd3eSStefano Zampini ierr = VecRestoreArray(pcbddc->vec1_P,&array);CHKERRQ(ierr); 8604fa34dd3eSStefano Zampini ierr = VecAssemblyBegin(pcis->vec1_N);CHKERRQ(ierr); 8605fa34dd3eSStefano Zampini ierr = VecAssemblyEnd(pcis->vec1_N);CHKERRQ(ierr); 8606fa34dd3eSStefano Zampini ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 8607fa34dd3eSStefano Zampini ierr = VecScatterEnd(pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 8608fa34dd3eSStefano Zampini /* global: \widetilde{B0}_B w_\Gamma */ 8609fa34dd3eSStefano Zampini if (zerodiag) { 8610fa34dd3eSStefano Zampini ierr = MatMult(B0_B,pcis->vec2_B,dummy_vec);CHKERRQ(ierr); 8611fa34dd3eSStefano Zampini ierr = VecGetArray(dummy_vec,&array);CHKERRQ(ierr); 86124f1b2e48SStefano Zampini for (i=0;i<pcbddc->benign_n;i++) pcbddc->benign_p0[i] = array[i]; 8613fa34dd3eSStefano Zampini ierr = 
VecRestoreArray(dummy_vec,&array);CHKERRQ(ierr); 8614fa34dd3eSStefano Zampini } 8615fa34dd3eSStefano Zampini /* BDDC */ 8616fa34dd3eSStefano Zampini ierr = VecSet(pcis->vec1_D,0.);CHKERRQ(ierr); 8617fa34dd3eSStefano Zampini ierr = PCBDDCApplyInterfacePreconditioner(pc,PETSC_FALSE);CHKERRQ(ierr); 8618fa34dd3eSStefano Zampini 8619fa34dd3eSStefano Zampini ierr = VecCopy(pcis->vec1_B,pcis->vec2_B);CHKERRQ(ierr); 8620fa34dd3eSStefano Zampini ierr = VecAXPY(pcis->vec1_B,-1.0,vec_check_B);CHKERRQ(ierr); 8621fa34dd3eSStefano Zampini ierr = VecNorm(pcis->vec1_B,NORM_INFINITY,&norm);CHKERRQ(ierr); 8622fa34dd3eSStefano Zampini PetscPrintf(PETSC_COMM_SELF,"[%d] BDDC local error is %1.4e\n",PetscGlobalRank,norm); 86234f1b2e48SStefano Zampini for (i=0;i<pcbddc->benign_n;i++) { 86244f1b2e48SStefano Zampini PetscPrintf(PETSC_COMM_SELF,"[%d] BDDC p0[%d] error is %1.4e\n",PetscGlobalRank,i,PetscAbsScalar(pcbddc->benign_p0[i]-p0_check[i])); 8625fa34dd3eSStefano Zampini } 86264f1b2e48SStefano Zampini ierr = PetscFree(p0_check);CHKERRQ(ierr); 8627fa34dd3eSStefano Zampini ierr = VecDestroy(&vec_scale_P);CHKERRQ(ierr); 8628fa34dd3eSStefano Zampini ierr = VecDestroy(&vec_check_B);CHKERRQ(ierr); 8629fa34dd3eSStefano Zampini ierr = VecDestroy(&dummy_vec);CHKERRQ(ierr); 8630fa34dd3eSStefano Zampini ierr = MatDestroy(&S_j);CHKERRQ(ierr); 8631fa34dd3eSStefano Zampini ierr = MatDestroy(&B0_B);CHKERRQ(ierr); 8632fa34dd3eSStefano Zampini } 8633fa34dd3eSStefano Zampini PetscFunctionReturn(0); 8634fa34dd3eSStefano Zampini } 86351e0482f5SStefano Zampini 86361e0482f5SStefano Zampini #include <../src/mat/impls/aij/mpi/mpiaij.h> 86371e0482f5SStefano Zampini PetscErrorCode MatMPIAIJRestrict(Mat A, MPI_Comm ccomm, Mat *B) 86381e0482f5SStefano Zampini { 86391e0482f5SStefano Zampini Mat At; 86401e0482f5SStefano Zampini IS rows; 86411e0482f5SStefano Zampini PetscInt rst,ren; 86421e0482f5SStefano Zampini PetscErrorCode ierr; 86431e0482f5SStefano Zampini PetscLayout rmap; 86441e0482f5SStefano Zampini 
86451e0482f5SStefano Zampini PetscFunctionBegin; 86461e0482f5SStefano Zampini rst = ren = 0; 86471e0482f5SStefano Zampini if (ccomm != MPI_COMM_NULL) { 86481e0482f5SStefano Zampini ierr = PetscLayoutCreate(ccomm,&rmap);CHKERRQ(ierr); 86491e0482f5SStefano Zampini ierr = PetscLayoutSetSize(rmap,A->rmap->N);CHKERRQ(ierr); 86501e0482f5SStefano Zampini ierr = PetscLayoutSetBlockSize(rmap,1);CHKERRQ(ierr); 86511e0482f5SStefano Zampini ierr = PetscLayoutSetUp(rmap);CHKERRQ(ierr); 86521e0482f5SStefano Zampini ierr = PetscLayoutGetRange(rmap,&rst,&ren);CHKERRQ(ierr); 86531e0482f5SStefano Zampini } 8654e07686f2SStefano Zampini ierr = ISCreateStride(PetscObjectComm((PetscObject)A),ren-rst,rst,1,&rows);CHKERRQ(ierr); 86557dae84e0SHong Zhang ierr = MatCreateSubMatrix(A,rows,NULL,MAT_INITIAL_MATRIX,&At);CHKERRQ(ierr); 86561e0482f5SStefano Zampini ierr = ISDestroy(&rows);CHKERRQ(ierr); 86571e0482f5SStefano Zampini 86581e0482f5SStefano Zampini if (ccomm != MPI_COMM_NULL) { 86591e0482f5SStefano Zampini Mat_MPIAIJ *a,*b; 86601e0482f5SStefano Zampini IS from,to; 86611e0482f5SStefano Zampini Vec gvec; 86621e0482f5SStefano Zampini PetscInt lsize; 86631e0482f5SStefano Zampini 86641e0482f5SStefano Zampini ierr = MatCreate(ccomm,B);CHKERRQ(ierr); 86651e0482f5SStefano Zampini ierr = MatSetSizes(*B,ren-rst,PETSC_DECIDE,PETSC_DECIDE,At->cmap->N);CHKERRQ(ierr); 86661e0482f5SStefano Zampini ierr = MatSetType(*B,MATAIJ);CHKERRQ(ierr); 86671e0482f5SStefano Zampini ierr = PetscLayoutDestroy(&((*B)->rmap));CHKERRQ(ierr); 86681e0482f5SStefano Zampini ierr = PetscLayoutSetUp((*B)->cmap);CHKERRQ(ierr); 86691e0482f5SStefano Zampini a = (Mat_MPIAIJ*)At->data; 86701e0482f5SStefano Zampini b = (Mat_MPIAIJ*)(*B)->data; 86711e0482f5SStefano Zampini ierr = MPI_Comm_size(ccomm,&b->size);CHKERRQ(ierr); 86721e0482f5SStefano Zampini ierr = MPI_Comm_rank(ccomm,&b->rank);CHKERRQ(ierr); 86731e0482f5SStefano Zampini ierr = PetscObjectReference((PetscObject)a->A);CHKERRQ(ierr); 86741e0482f5SStefano Zampini ierr = 
PetscObjectReference((PetscObject)a->B);CHKERRQ(ierr); 86751e0482f5SStefano Zampini b->A = a->A; 86761e0482f5SStefano Zampini b->B = a->B; 86771e0482f5SStefano Zampini 86781e0482f5SStefano Zampini b->donotstash = a->donotstash; 86791e0482f5SStefano Zampini b->roworiented = a->roworiented; 86801e0482f5SStefano Zampini b->rowindices = 0; 86811e0482f5SStefano Zampini b->rowvalues = 0; 86821e0482f5SStefano Zampini b->getrowactive = PETSC_FALSE; 86831e0482f5SStefano Zampini 86841e0482f5SStefano Zampini (*B)->rmap = rmap; 86851e0482f5SStefano Zampini (*B)->factortype = A->factortype; 86861e0482f5SStefano Zampini (*B)->assembled = PETSC_TRUE; 86871e0482f5SStefano Zampini (*B)->insertmode = NOT_SET_VALUES; 86881e0482f5SStefano Zampini (*B)->preallocated = PETSC_TRUE; 86891e0482f5SStefano Zampini 86901e0482f5SStefano Zampini if (a->colmap) { 86911e0482f5SStefano Zampini #if defined(PETSC_USE_CTABLE) 86921e0482f5SStefano Zampini ierr = PetscTableCreateCopy(a->colmap,&b->colmap);CHKERRQ(ierr); 86931e0482f5SStefano Zampini #else 86941e0482f5SStefano Zampini ierr = PetscMalloc1(At->cmap->N,&b->colmap);CHKERRQ(ierr); 86951e0482f5SStefano Zampini ierr = PetscLogObjectMemory((PetscObject)*B,At->cmap->N*sizeof(PetscInt));CHKERRQ(ierr); 86961e0482f5SStefano Zampini ierr = PetscMemcpy(b->colmap,a->colmap,At->cmap->N*sizeof(PetscInt));CHKERRQ(ierr); 86971e0482f5SStefano Zampini #endif 86981e0482f5SStefano Zampini } else b->colmap = 0; 86991e0482f5SStefano Zampini if (a->garray) { 87001e0482f5SStefano Zampini PetscInt len; 87011e0482f5SStefano Zampini len = a->B->cmap->n; 87021e0482f5SStefano Zampini ierr = PetscMalloc1(len+1,&b->garray);CHKERRQ(ierr); 87031e0482f5SStefano Zampini ierr = PetscLogObjectMemory((PetscObject)(*B),len*sizeof(PetscInt));CHKERRQ(ierr); 87041e0482f5SStefano Zampini if (len) { ierr = PetscMemcpy(b->garray,a->garray,len*sizeof(PetscInt));CHKERRQ(ierr); } 87051e0482f5SStefano Zampini } else b->garray = 0; 87061e0482f5SStefano Zampini 87071e0482f5SStefano Zampini 
ierr = PetscObjectReference((PetscObject)a->lvec);CHKERRQ(ierr); 87081e0482f5SStefano Zampini b->lvec = a->lvec; 87091e0482f5SStefano Zampini ierr = PetscLogObjectParent((PetscObject)*B,(PetscObject)b->lvec);CHKERRQ(ierr); 87101e0482f5SStefano Zampini 87111e0482f5SStefano Zampini /* cannot use VecScatterCopy */ 87121e0482f5SStefano Zampini ierr = VecGetLocalSize(b->lvec,&lsize);CHKERRQ(ierr); 87131e0482f5SStefano Zampini ierr = ISCreateGeneral(ccomm,lsize,b->garray,PETSC_USE_POINTER,&from);CHKERRQ(ierr); 87141e0482f5SStefano Zampini ierr = ISCreateStride(PETSC_COMM_SELF,lsize,0,1,&to);CHKERRQ(ierr); 87151e0482f5SStefano Zampini ierr = MatCreateVecs(*B,&gvec,NULL);CHKERRQ(ierr); 87161e0482f5SStefano Zampini ierr = VecScatterCreate(gvec,from,b->lvec,to,&b->Mvctx);CHKERRQ(ierr); 87171e0482f5SStefano Zampini ierr = PetscLogObjectParent((PetscObject)*B,(PetscObject)b->Mvctx);CHKERRQ(ierr); 87181e0482f5SStefano Zampini ierr = ISDestroy(&from);CHKERRQ(ierr); 87191e0482f5SStefano Zampini ierr = ISDestroy(&to);CHKERRQ(ierr); 87201e0482f5SStefano Zampini ierr = VecDestroy(&gvec);CHKERRQ(ierr); 87211e0482f5SStefano Zampini } 87221e0482f5SStefano Zampini ierr = MatDestroy(&At);CHKERRQ(ierr); 87231e0482f5SStefano Zampini PetscFunctionReturn(0); 87241e0482f5SStefano Zampini } 8725