11cf9b237SStefano Zampini #include <../src/mat/impls/aij/seq/aij.h> 2ab5c6b0cSJed Brown #include <../src/ksp/pc/impls/bddc/bddc.h> 3ab5c6b0cSJed Brown #include <../src/ksp/pc/impls/bddc/bddcprivate.h> 4c80a6c00SStefano Zampini #include <petscdmplex.h> 5674ae819SStefano Zampini #include <petscblaslapack.h> 6daf8a457SStefano Zampini #include <petsc/private/sfimpl.h> 7c80a6c00SStefano Zampini #include <petsc/private/dmpleximpl.h> 8674ae819SStefano Zampini 91e0482f5SStefano Zampini static PetscErrorCode MatMPIAIJRestrict(Mat,MPI_Comm,Mat*); 101e0482f5SStefano Zampini 11f498cd09SStefano Zampini /* if range is true, it returns B s.t. span{B} = range(A) 12f498cd09SStefano Zampini if range is false, it returns B s.t. range(B) _|_ range(A) */ 13f498cd09SStefano Zampini PetscErrorCode MatDenseOrthogonalRangeOrComplement(Mat A, PetscBool range, PetscInt lw, PetscScalar *work, PetscReal *rwork, Mat *B) 14a13144ffSStefano Zampini { 15a13144ffSStefano Zampini #if !defined(PETSC_USE_COMPLEX) 16a13144ffSStefano Zampini PetscScalar *uwork,*data,*U, ds = 0.; 17a13144ffSStefano Zampini PetscReal *sing; 18a13144ffSStefano Zampini PetscBLASInt bM,bN,lwork,lierr,di = 1; 19a13144ffSStefano Zampini PetscInt ulw,i,nr,nc,n; 20a13144ffSStefano Zampini PetscErrorCode ierr; 21a13144ffSStefano Zampini 22a13144ffSStefano Zampini PetscFunctionBegin; 23a13144ffSStefano Zampini #if defined(PETSC_MISSING_LAPACK_GESVD) 24a13144ffSStefano Zampini SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"LAPACK _GESVD not available"); 25614dbb09SStefano Zampini #else 26a13144ffSStefano Zampini ierr = MatGetSize(A,&nr,&nc);CHKERRQ(ierr); 27a13144ffSStefano Zampini if (!nr || !nc) PetscFunctionReturn(0); 28a13144ffSStefano Zampini 29a13144ffSStefano Zampini /* workspace */ 30a13144ffSStefano Zampini if (!work) { 31a13144ffSStefano Zampini ulw = PetscMax(PetscMax(1,5*PetscMin(nr,nc)),3*PetscMin(nr,nc)+PetscMax(nr,nc)); 32f913dca9SStefano Zampini ierr = PetscMalloc1(ulw,&uwork);CHKERRQ(ierr); 33a13144ffSStefano Zampini } 
else { 34a13144ffSStefano Zampini ulw = lw; 35a13144ffSStefano Zampini uwork = work; 36a13144ffSStefano Zampini } 37a13144ffSStefano Zampini n = PetscMin(nr,nc); 38a13144ffSStefano Zampini if (!rwork) { 39a13144ffSStefano Zampini ierr = PetscMalloc1(n,&sing);CHKERRQ(ierr); 40a13144ffSStefano Zampini } else { 41a13144ffSStefano Zampini sing = rwork; 42a13144ffSStefano Zampini } 43a13144ffSStefano Zampini 44a13144ffSStefano Zampini /* SVD */ 45a13144ffSStefano Zampini ierr = PetscMalloc1(nr*nr,&U);CHKERRQ(ierr); 46a13144ffSStefano Zampini ierr = PetscBLASIntCast(nr,&bM);CHKERRQ(ierr); 47a13144ffSStefano Zampini ierr = PetscBLASIntCast(nc,&bN);CHKERRQ(ierr); 48a13144ffSStefano Zampini ierr = PetscBLASIntCast(ulw,&lwork);CHKERRQ(ierr); 49a13144ffSStefano Zampini ierr = MatDenseGetArray(A,&data);CHKERRQ(ierr); 50a13144ffSStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 51a13144ffSStefano Zampini PetscStackCallBLAS("LAPACKgesvd",LAPACKgesvd_("A","N",&bM,&bN,data,&bM,sing,U,&bM,&ds,&di,uwork,&lwork,&lierr)); 52a13144ffSStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 53a13144ffSStefano Zampini if (lierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in GESVD Lapack routine %d",(int)lierr); 54a13144ffSStefano Zampini ierr = MatDenseRestoreArray(A,&data);CHKERRQ(ierr); 55a13144ffSStefano Zampini for (i=0;i<n;i++) if (sing[i] < PETSC_SMALL) break; 56a13144ffSStefano Zampini if (!rwork) { 57a13144ffSStefano Zampini ierr = PetscFree(sing);CHKERRQ(ierr); 58a13144ffSStefano Zampini } 59a13144ffSStefano Zampini if (!work) { 60a13144ffSStefano Zampini ierr = PetscFree(uwork);CHKERRQ(ierr); 61a13144ffSStefano Zampini } 62a13144ffSStefano Zampini /* create B */ 63f498cd09SStefano Zampini if (!range) { 64a13144ffSStefano Zampini ierr = MatCreateSeqDense(PETSC_COMM_SELF,nr,nr-i,NULL,B);CHKERRQ(ierr); 65a13144ffSStefano Zampini ierr = MatDenseGetArray(*B,&data);CHKERRQ(ierr); 66a13144ffSStefano Zampini ierr = 
PetscMemcpy(data,U+nr*i,(nr-i)*nr*sizeof(PetscScalar));CHKERRQ(ierr); 67f498cd09SStefano Zampini } else { 68f498cd09SStefano Zampini ierr = MatCreateSeqDense(PETSC_COMM_SELF,nr,i,NULL,B);CHKERRQ(ierr); 69f498cd09SStefano Zampini ierr = MatDenseGetArray(*B,&data);CHKERRQ(ierr); 70f498cd09SStefano Zampini ierr = PetscMemcpy(data,U,i*nr*sizeof(PetscScalar));CHKERRQ(ierr); 71f498cd09SStefano Zampini } 72a13144ffSStefano Zampini ierr = MatDenseRestoreArray(*B,&data);CHKERRQ(ierr); 73a13144ffSStefano Zampini ierr = PetscFree(U);CHKERRQ(ierr); 74614dbb09SStefano Zampini #endif 75614dbb09SStefano Zampini #else /* PETSC_USE_COMPLEX */ 76a13144ffSStefano Zampini PetscFunctionBegin; 77a13144ffSStefano Zampini SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"Not implemented for complexes"); 78a13144ffSStefano Zampini #endif 79a13144ffSStefano Zampini PetscFunctionReturn(0); 80a13144ffSStefano Zampini } 81a13144ffSStefano Zampini 821e0482f5SStefano Zampini /* TODO REMOVE */ 831e0482f5SStefano Zampini #if defined(PRINT_GDET) 841e0482f5SStefano Zampini static int inc = 0; 851e0482f5SStefano Zampini static int lev = 0; 861e0482f5SStefano Zampini #endif 871e0482f5SStefano Zampini 881e0482f5SStefano Zampini PetscErrorCode PCBDDCComputeNedelecChangeEdge(Mat lG, IS edge, IS extrow, IS extcol, IS corners, Mat* Gins, Mat* GKins, PetscScalar cvals[2], PetscScalar *work, PetscReal *rwork) 89a13144ffSStefano Zampini { 90a13144ffSStefano Zampini PetscErrorCode ierr; 91a13144ffSStefano Zampini Mat GE,GEd; 92a13144ffSStefano Zampini PetscInt rsize,csize,esize; 93a13144ffSStefano Zampini PetscScalar *ptr; 94a13144ffSStefano Zampini 95a13144ffSStefano Zampini PetscFunctionBegin; 96a13144ffSStefano Zampini ierr = ISGetSize(edge,&esize);CHKERRQ(ierr); 97c3c0e390SStefano Zampini if (!esize) PetscFunctionReturn(0); 98a13144ffSStefano Zampini ierr = ISGetSize(extrow,&rsize);CHKERRQ(ierr); 99a13144ffSStefano Zampini ierr = ISGetSize(extcol,&csize);CHKERRQ(ierr); 100a13144ffSStefano Zampini 101a13144ffSStefano 
Zampini /* gradients */ 102a13144ffSStefano Zampini ptr = work + 5*esize; 1037dae84e0SHong Zhang ierr = MatCreateSubMatrix(lG,extrow,extcol,MAT_INITIAL_MATRIX,&GE);CHKERRQ(ierr); 104a13144ffSStefano Zampini ierr = MatCreateSeqDense(PETSC_COMM_SELF,rsize,csize,ptr,Gins);CHKERRQ(ierr); 105a13144ffSStefano Zampini ierr = MatConvert(GE,MATSEQDENSE,MAT_REUSE_MATRIX,Gins);CHKERRQ(ierr); 106a13144ffSStefano Zampini ierr = MatDestroy(&GE);CHKERRQ(ierr); 107a13144ffSStefano Zampini 108a13144ffSStefano Zampini /* constants */ 109a13144ffSStefano Zampini ptr += rsize*csize; 110a13144ffSStefano Zampini ierr = MatCreateSeqDense(PETSC_COMM_SELF,esize,csize,ptr,&GEd);CHKERRQ(ierr); 1117dae84e0SHong Zhang ierr = MatCreateSubMatrix(lG,edge,extcol,MAT_INITIAL_MATRIX,&GE);CHKERRQ(ierr); 112a13144ffSStefano Zampini ierr = MatConvert(GE,MATSEQDENSE,MAT_REUSE_MATRIX,&GEd);CHKERRQ(ierr); 113a13144ffSStefano Zampini ierr = MatDestroy(&GE);CHKERRQ(ierr); 114f498cd09SStefano Zampini ierr = MatDenseOrthogonalRangeOrComplement(GEd,PETSC_FALSE,5*esize,work,rwork,GKins);CHKERRQ(ierr); 115a13144ffSStefano Zampini ierr = MatDestroy(&GEd);CHKERRQ(ierr); 1161e0482f5SStefano Zampini 1171e0482f5SStefano Zampini if (corners) { 1181e0482f5SStefano Zampini Mat GEc; 1191e0482f5SStefano Zampini PetscScalar *vals,v; 1201e0482f5SStefano Zampini 1217dae84e0SHong Zhang ierr = MatCreateSubMatrix(lG,edge,corners,MAT_INITIAL_MATRIX,&GEc);CHKERRQ(ierr); 1221e0482f5SStefano Zampini ierr = MatTransposeMatMult(GEc,*GKins,MAT_INITIAL_MATRIX,1.0,&GEd);CHKERRQ(ierr); 1231e0482f5SStefano Zampini ierr = MatDenseGetArray(GEd,&vals);CHKERRQ(ierr); 124637e8532SStefano Zampini /* v = PetscAbsScalar(vals[0]) */; 125637e8532SStefano Zampini v = 1.; 1261e0482f5SStefano Zampini cvals[0] = vals[0]/v; 1271e0482f5SStefano Zampini cvals[1] = vals[1]/v; 1281e0482f5SStefano Zampini ierr = MatDenseRestoreArray(GEd,&vals);CHKERRQ(ierr); 1291e0482f5SStefano Zampini ierr = MatScale(*GKins,1./v);CHKERRQ(ierr); 1301e0482f5SStefano Zampini 
#if defined(PRINT_GDET) 1311e0482f5SStefano Zampini { 1321e0482f5SStefano Zampini PetscViewer viewer; 1331e0482f5SStefano Zampini char filename[256]; 1341e0482f5SStefano Zampini sprintf(filename,"Gdet_l%d_r%d_cc%d.m",lev,PetscGlobalRank,inc++); 1351e0482f5SStefano Zampini ierr = PetscViewerASCIIOpen(PETSC_COMM_SELF,filename,&viewer);CHKERRQ(ierr); 1361e0482f5SStefano Zampini ierr = PetscViewerPushFormat(viewer,PETSC_VIEWER_ASCII_MATLAB);CHKERRQ(ierr); 1371e0482f5SStefano Zampini ierr = PetscObjectSetName((PetscObject)GEc,"GEc");CHKERRQ(ierr); 1381e0482f5SStefano Zampini ierr = MatView(GEc,viewer);CHKERRQ(ierr); 1391e0482f5SStefano Zampini ierr = PetscObjectSetName((PetscObject)(*GKins),"GK");CHKERRQ(ierr); 1401e0482f5SStefano Zampini ierr = MatView(*GKins,viewer);CHKERRQ(ierr); 1411e0482f5SStefano Zampini ierr = PetscObjectSetName((PetscObject)GEd,"Gproj");CHKERRQ(ierr); 1421e0482f5SStefano Zampini ierr = MatView(GEd,viewer);CHKERRQ(ierr); 1431e0482f5SStefano Zampini ierr = PetscViewerDestroy(&viewer);CHKERRQ(ierr); 1441e0482f5SStefano Zampini } 1451e0482f5SStefano Zampini #endif 1461e0482f5SStefano Zampini ierr = MatDestroy(&GEd);CHKERRQ(ierr); 1471e0482f5SStefano Zampini ierr = MatDestroy(&GEc);CHKERRQ(ierr); 1481e0482f5SStefano Zampini } 1491e0482f5SStefano Zampini 150a13144ffSStefano Zampini PetscFunctionReturn(0); 151a13144ffSStefano Zampini } 152a13144ffSStefano Zampini 153a13144ffSStefano Zampini PetscErrorCode PCBDDCNedelecSupport(PC pc) 154a13144ffSStefano Zampini { 155a13144ffSStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 156a13144ffSStefano Zampini Mat_IS *matis = (Mat_IS*)pc->pmat->data; 1570569b399SStefano Zampini Mat G,T,conn,lG,lGt,lGis,lGall,lGe,lGinit; 158eee23b56SStefano Zampini Vec tvec; 159a13144ffSStefano Zampini PetscSF sfv; 1601e0482f5SStefano Zampini ISLocalToGlobalMapping el2g,vl2g,fl2g,al2g; 161a13144ffSStefano Zampini MPI_Comm comm; 162c2151214SStefano Zampini IS lned,primals,allprimals,nedfieldlocal; 163c2151214SStefano Zampini 
IS *eedges,*extrows,*extcols,*alleedges; 1647d871cd7SStefano Zampini PetscBT btv,bte,btvc,btb,btbd,btvcand,btvi,btee,bter; 165a13144ffSStefano Zampini PetscScalar *vals,*work; 166a13144ffSStefano Zampini PetscReal *rwork; 167a13144ffSStefano Zampini const PetscInt *idxs,*ii,*jj,*iit,*jjt; 1681e0482f5SStefano Zampini PetscInt ne,nv,Lv,order,n,field; 169a13144ffSStefano Zampini PetscInt n_neigh,*neigh,*n_shared,**shared; 170eee23b56SStefano Zampini PetscInt i,j,extmem,cum,maxsize,nee; 171b03ebc13SStefano Zampini PetscInt *extrow,*extrowcum,*marks,*vmarks,*gidxs; 172a13144ffSStefano Zampini PetscInt *sfvleaves,*sfvroots; 173b03ebc13SStefano Zampini PetscInt *corners,*cedges; 174637e8532SStefano Zampini PetscInt *ecount,**eneighs,*vcount,**vneighs; 175b03ebc13SStefano Zampini #if defined(PETSC_USE_DEBUG) 176b03ebc13SStefano Zampini PetscInt *emarks; 177b03ebc13SStefano Zampini #endif 178213b8bfaSStefano Zampini PetscBool print,eerr,done,lrc[2],conforming,global,singular,setprimal; 179a13144ffSStefano Zampini PetscErrorCode ierr; 180a13144ffSStefano Zampini 181a13144ffSStefano Zampini PetscFunctionBegin; 182213b8bfaSStefano Zampini /* If the discrete gradient is defined for a subset of dofs and global is true, 183213b8bfaSStefano Zampini it assumes G is given in global ordering for all the dofs. 
184213b8bfaSStefano Zampini Otherwise, the ordering is global for the Nedelec field */ 185213b8bfaSStefano Zampini order = pcbddc->nedorder; 186213b8bfaSStefano Zampini conforming = pcbddc->conforming; 187213b8bfaSStefano Zampini field = pcbddc->nedfield; 188213b8bfaSStefano Zampini global = pcbddc->nedglobal; 189213b8bfaSStefano Zampini setprimal = PETSC_FALSE; 190a13144ffSStefano Zampini print = PETSC_FALSE; 191213b8bfaSStefano Zampini singular = PETSC_FALSE; 192a13144ffSStefano Zampini 193213b8bfaSStefano Zampini /* Command line customization */ 194213b8bfaSStefano Zampini ierr = PetscOptionsBegin(PetscObjectComm((PetscObject)pc),((PetscObject)pc)->prefix,"BDDC Nedelec options","PC");CHKERRQ(ierr); 195213b8bfaSStefano Zampini ierr = PetscOptionsBool("-pc_bddc_nedelec_field_primal","All edge dofs set as primals: Toselli's algorithm C",NULL,setprimal,&setprimal,NULL);CHKERRQ(ierr); 196213b8bfaSStefano Zampini ierr = PetscOptionsBool("-pc_bddc_nedelec_singular","Infer nullspace from discrete gradient",NULL,singular,&singular,NULL);CHKERRQ(ierr); 197213b8bfaSStefano Zampini ierr = PetscOptionsInt("-pc_bddc_nedelec_order","Test variable order code (to be removed)",NULL,order,&order,NULL);CHKERRQ(ierr); 198213b8bfaSStefano Zampini /* print debug info TODO: to be removed */ 199213b8bfaSStefano Zampini ierr = PetscOptionsBool("-pc_bddc_nedelec_print","Print debug info",NULL,print,&print,NULL);CHKERRQ(ierr); 200213b8bfaSStefano Zampini ierr = PetscOptionsEnd();CHKERRQ(ierr); 201213b8bfaSStefano Zampini 202213b8bfaSStefano Zampini /* Return if there are no edges in the decomposition and the problem is not singular */ 2031e0482f5SStefano Zampini ierr = MatGetLocalToGlobalMapping(pc->pmat,&al2g,NULL);CHKERRQ(ierr); 2041e0482f5SStefano Zampini ierr = ISLocalToGlobalMappingGetSize(al2g,&n);CHKERRQ(ierr); 205213b8bfaSStefano Zampini ierr = PetscObjectGetComm((PetscObject)pc,&comm);CHKERRQ(ierr); 206213b8bfaSStefano Zampini if (!singular) { 207a13144ffSStefano Zampini ierr = 
VecGetArrayRead(matis->counter,(const PetscScalar**)&vals);CHKERRQ(ierr); 208a13144ffSStefano Zampini lrc[0] = PETSC_FALSE; 209c2151214SStefano Zampini for (i=0;i<n;i++) { 210a13144ffSStefano Zampini if (PetscRealPart(vals[i]) > 2.) { 211a13144ffSStefano Zampini lrc[0] = PETSC_TRUE; 212a13144ffSStefano Zampini break; 213a13144ffSStefano Zampini } 214a13144ffSStefano Zampini } 215a13144ffSStefano Zampini ierr = VecRestoreArrayRead(matis->counter,(const PetscScalar**)&vals);CHKERRQ(ierr); 216a13144ffSStefano Zampini ierr = MPIU_Allreduce(&lrc[0],&lrc[1],1,MPIU_BOOL,MPI_LOR,comm);CHKERRQ(ierr); 217a13144ffSStefano Zampini if (!lrc[1]) PetscFunctionReturn(0); 218213b8bfaSStefano Zampini } 219a13144ffSStefano Zampini 220213b8bfaSStefano Zampini /* Get Nedelec field */ 221213b8bfaSStefano Zampini ierr = MatISSetUpSF(pc->pmat);CHKERRQ(ierr); 222c2151214SStefano Zampini if (pcbddc->n_ISForDofsLocal && field >= pcbddc->n_ISForDofsLocal) SETERRQ2(comm,PETSC_ERR_USER,"Invalid field for Nedelec %d: number of fields is %d",field,pcbddc->n_ISForDofsLocal); 223213b8bfaSStefano Zampini if (pcbddc->n_ISForDofsLocal && field >= 0) { 224c2151214SStefano Zampini ierr = PetscObjectReference((PetscObject)pcbddc->ISForDofsLocal[field]);CHKERRQ(ierr); 225c2151214SStefano Zampini nedfieldlocal = pcbddc->ISForDofsLocal[field]; 226c2151214SStefano Zampini ierr = ISGetLocalSize(nedfieldlocal,&ne);CHKERRQ(ierr); 227213b8bfaSStefano Zampini } else if (!pcbddc->n_ISForDofsLocal && field != PETSC_DECIDE) { 228213b8bfaSStefano Zampini ne = n; 229213b8bfaSStefano Zampini nedfieldlocal = NULL; 230213b8bfaSStefano Zampini global = PETSC_TRUE; 231213b8bfaSStefano Zampini } else if (field == PETSC_DECIDE) { 232213b8bfaSStefano Zampini PetscInt rst,ren,*idx; 233213b8bfaSStefano Zampini 234213b8bfaSStefano Zampini ierr = PetscMemzero(matis->sf_leafdata,n*sizeof(PetscInt));CHKERRQ(ierr); 235213b8bfaSStefano Zampini ierr = PetscMemzero(matis->sf_rootdata,pc->pmat->rmap->n*sizeof(PetscInt));CHKERRQ(ierr); 
236213b8bfaSStefano Zampini ierr = MatGetOwnershipRange(pcbddc->discretegradient,&rst,&ren);CHKERRQ(ierr); 237213b8bfaSStefano Zampini for (i=rst;i<ren;i++) { 238213b8bfaSStefano Zampini PetscInt nc; 239213b8bfaSStefano Zampini 240213b8bfaSStefano Zampini ierr = MatGetRow(pcbddc->discretegradient,i,&nc,NULL,NULL);CHKERRQ(ierr); 241213b8bfaSStefano Zampini if (nc > 1) matis->sf_rootdata[i-rst] = 1; 242213b8bfaSStefano Zampini ierr = MatRestoreRow(pcbddc->discretegradient,i,&nc,NULL,NULL);CHKERRQ(ierr); 243213b8bfaSStefano Zampini } 244213b8bfaSStefano Zampini ierr = PetscSFBcastBegin(matis->sf,MPIU_INT,matis->sf_rootdata,matis->sf_leafdata);CHKERRQ(ierr); 245213b8bfaSStefano Zampini ierr = PetscSFBcastEnd(matis->sf,MPIU_INT,matis->sf_rootdata,matis->sf_leafdata);CHKERRQ(ierr); 246213b8bfaSStefano Zampini ierr = PetscMalloc1(n,&idx);CHKERRQ(ierr); 247213b8bfaSStefano Zampini for (i=0,ne=0;i<n;i++) if (matis->sf_leafdata[i]) idx[ne++] = i; 248213b8bfaSStefano Zampini ierr = ISCreateGeneral(comm,ne,idx,PETSC_OWN_POINTER,&nedfieldlocal);CHKERRQ(ierr); 249213b8bfaSStefano Zampini } else { 250213b8bfaSStefano Zampini SETERRQ(comm,PETSC_ERR_USER,"When multiple fields are present, the Nedelec field has to be specified"); 251213b8bfaSStefano Zampini } 252213b8bfaSStefano Zampini 253213b8bfaSStefano Zampini /* Sanity checks */ 254213b8bfaSStefano Zampini if (!order && !conforming) SETERRQ(comm,PETSC_ERR_SUP,"Variable order and non-conforming spaces are not supported at the same time"); 255213b8bfaSStefano Zampini if (pcbddc->user_ChangeOfBasisMatrix) SETERRQ(comm,PETSC_ERR_SUP,"Cannot generate Nedelec support with user defined change of basis"); 256213b8bfaSStefano Zampini if (order && ne%order) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_USER,"The number of local edge dofs %d it's not a multiple of the order %d",ne,order); 257213b8bfaSStefano Zampini 258213b8bfaSStefano Zampini /* Just set primal dofs and return */ 2591e0482f5SStefano Zampini if (setprimal) { 260eee23b56SStefano 
Zampini IS enedfieldlocal; 261eee23b56SStefano Zampini PetscInt *eidxs; 262eee23b56SStefano Zampini 263eee23b56SStefano Zampini ierr = PetscMalloc1(ne,&eidxs);CHKERRQ(ierr); 264eee23b56SStefano Zampini ierr = VecGetArrayRead(matis->counter,(const PetscScalar**)&vals);CHKERRQ(ierr); 265213b8bfaSStefano Zampini if (nedfieldlocal) { 266213b8bfaSStefano Zampini ierr = ISGetIndices(nedfieldlocal,&idxs);CHKERRQ(ierr); 267eee23b56SStefano Zampini for (i=0,cum=0;i<ne;i++) { 268eee23b56SStefano Zampini if (PetscRealPart(vals[idxs[i]]) > 2.) { 269eee23b56SStefano Zampini eidxs[cum++] = idxs[i]; 270eee23b56SStefano Zampini } 271eee23b56SStefano Zampini } 272eee23b56SStefano Zampini ierr = ISRestoreIndices(nedfieldlocal,&idxs);CHKERRQ(ierr); 273213b8bfaSStefano Zampini } else { 274213b8bfaSStefano Zampini for (i=0,cum=0;i<ne;i++) { 275213b8bfaSStefano Zampini if (PetscRealPart(vals[i]) > 2.) { 276213b8bfaSStefano Zampini eidxs[cum++] = i; 277213b8bfaSStefano Zampini } 278213b8bfaSStefano Zampini } 279213b8bfaSStefano Zampini } 280213b8bfaSStefano Zampini ierr = VecRestoreArrayRead(matis->counter,(const PetscScalar**)&vals);CHKERRQ(ierr); 281eee23b56SStefano Zampini ierr = ISCreateGeneral(comm,cum,eidxs,PETSC_COPY_VALUES,&enedfieldlocal);CHKERRQ(ierr); 282eee23b56SStefano Zampini ierr = PCBDDCSetPrimalVerticesLocalIS(pc,enedfieldlocal);CHKERRQ(ierr); 283eee23b56SStefano Zampini ierr = PetscFree(eidxs);CHKERRQ(ierr); 2841e0482f5SStefano Zampini ierr = ISDestroy(&nedfieldlocal);CHKERRQ(ierr); 285eee23b56SStefano Zampini ierr = ISDestroy(&enedfieldlocal);CHKERRQ(ierr); 2861e0482f5SStefano Zampini PetscFunctionReturn(0); 2871e0482f5SStefano Zampini } 288a13144ffSStefano Zampini 289213b8bfaSStefano Zampini /* Compute some l2g maps */ 290213b8bfaSStefano Zampini if (nedfieldlocal) { 291c2151214SStefano Zampini IS is; 292c2151214SStefano Zampini 293c2151214SStefano Zampini /* need to map from the local Nedelec field to local numbering */ 294c2151214SStefano Zampini ierr = 
ISLocalToGlobalMappingCreateIS(nedfieldlocal,&fl2g);CHKERRQ(ierr); 2951e0482f5SStefano Zampini /* need to map from the local Nedelec field to global numbering for the whole dofs*/ 2961e0482f5SStefano Zampini ierr = ISLocalToGlobalMappingApplyIS(al2g,nedfieldlocal,&is);CHKERRQ(ierr); 2971e0482f5SStefano Zampini ierr = ISLocalToGlobalMappingCreateIS(is,&al2g);CHKERRQ(ierr); 2981e0482f5SStefano Zampini /* need to map from the local Nedelec field to global numbering (for Nedelec only) */ 2991e0482f5SStefano Zampini if (global) { 3001e0482f5SStefano Zampini ierr = PetscObjectReference((PetscObject)al2g);CHKERRQ(ierr); 3011e0482f5SStefano Zampini el2g = al2g; 3021e0482f5SStefano Zampini } else { 3031e0482f5SStefano Zampini IS gis; 3041e0482f5SStefano Zampini 3051e0482f5SStefano Zampini ierr = ISRenumber(is,NULL,NULL,&gis);CHKERRQ(ierr); 3061e0482f5SStefano Zampini ierr = ISLocalToGlobalMappingCreateIS(gis,&el2g);CHKERRQ(ierr); 3071e0482f5SStefano Zampini ierr = ISDestroy(&gis);CHKERRQ(ierr); 3081e0482f5SStefano Zampini } 309c2151214SStefano Zampini ierr = ISDestroy(&is);CHKERRQ(ierr); 310c2151214SStefano Zampini } else { 3111e0482f5SStefano Zampini /* restore default */ 3121e0482f5SStefano Zampini pcbddc->nedfield = -1; 3131e0482f5SStefano Zampini /* one ref for the destruction of al2g, one for el2g */ 3141e0482f5SStefano Zampini ierr = PetscObjectReference((PetscObject)al2g);CHKERRQ(ierr); 3151e0482f5SStefano Zampini ierr = PetscObjectReference((PetscObject)al2g);CHKERRQ(ierr); 3161e0482f5SStefano Zampini el2g = al2g; 317c2151214SStefano Zampini fl2g = NULL; 318c2151214SStefano Zampini } 319a13144ffSStefano Zampini 320213b8bfaSStefano Zampini /* Start communication to drop connections for interior edges (for cc analysis only) */ 321c2151214SStefano Zampini ierr = PetscMemzero(matis->sf_leafdata,n*sizeof(PetscInt));CHKERRQ(ierr); 322c2151214SStefano Zampini ierr = PetscMemzero(matis->sf_rootdata,pc->pmat->rmap->n*sizeof(PetscInt));CHKERRQ(ierr); 323c2151214SStefano 
Zampini if (nedfieldlocal) { 324c2151214SStefano Zampini ierr = ISGetIndices(nedfieldlocal,&idxs);CHKERRQ(ierr); 325c2151214SStefano Zampini for (i=0;i<ne;i++) matis->sf_leafdata[idxs[i]] = 1; 326c2151214SStefano Zampini ierr = ISRestoreIndices(nedfieldlocal,&idxs);CHKERRQ(ierr); 327c2151214SStefano Zampini } else { 328c2151214SStefano Zampini for (i=0;i<ne;i++) matis->sf_leafdata[i] = 1; 329c2151214SStefano Zampini } 330c2151214SStefano Zampini ierr = PetscSFReduceBegin(matis->sf,MPIU_INT,matis->sf_leafdata,matis->sf_rootdata,MPI_SUM);CHKERRQ(ierr); 331c2151214SStefano Zampini ierr = PetscSFReduceEnd(matis->sf,MPIU_INT,matis->sf_leafdata,matis->sf_rootdata,MPI_SUM);CHKERRQ(ierr); 332213b8bfaSStefano Zampini 333213b8bfaSStefano Zampini if (!singular) { /* drop connections with interior edges to avoid unneeded communications and memory movements */ 334213b8bfaSStefano Zampini ierr = MatDuplicate(pcbddc->discretegradient,MAT_COPY_VALUES,&G);CHKERRQ(ierr); 335213b8bfaSStefano Zampini ierr = MatSetOption(G,MAT_KEEP_NONZERO_PATTERN,PETSC_FALSE);CHKERRQ(ierr); 3361e0482f5SStefano Zampini if (global) { 3371e0482f5SStefano Zampini PetscInt rst; 3381e0482f5SStefano Zampini 339c2151214SStefano Zampini ierr = MatGetOwnershipRange(G,&rst,NULL);CHKERRQ(ierr); 340c2151214SStefano Zampini for (i=0,cum=0;i<pc->pmat->rmap->n;i++) { 341c2151214SStefano Zampini if (matis->sf_rootdata[i] < 2) { 342c2151214SStefano Zampini matis->sf_rootdata[cum++] = i + rst; 343c2151214SStefano Zampini } 344c2151214SStefano Zampini } 345a13144ffSStefano Zampini ierr = MatSetOption(G,MAT_NO_OFF_PROC_ZERO_ROWS,PETSC_TRUE);CHKERRQ(ierr); 346c2151214SStefano Zampini ierr = MatZeroRows(G,cum,matis->sf_rootdata,0.,NULL,NULL);CHKERRQ(ierr); 3471e0482f5SStefano Zampini } else { 3481e0482f5SStefano Zampini PetscInt *tbz; 3491e0482f5SStefano Zampini 3501e0482f5SStefano Zampini ierr = PetscMalloc1(ne,&tbz);CHKERRQ(ierr); 3511e0482f5SStefano Zampini ierr = 
PetscSFBcastBegin(matis->sf,MPIU_INT,matis->sf_rootdata,matis->sf_leafdata);CHKERRQ(ierr); 3521e0482f5SStefano Zampini ierr = PetscSFBcastEnd(matis->sf,MPIU_INT,matis->sf_rootdata,matis->sf_leafdata);CHKERRQ(ierr); 3531e0482f5SStefano Zampini ierr = ISGetIndices(nedfieldlocal,&idxs);CHKERRQ(ierr); 3541e0482f5SStefano Zampini for (i=0,cum=0;i<ne;i++) 3551e0482f5SStefano Zampini if (matis->sf_leafdata[idxs[i]] == 1) 3561e0482f5SStefano Zampini tbz[cum++] = i; 3571e0482f5SStefano Zampini ierr = ISRestoreIndices(nedfieldlocal,&idxs);CHKERRQ(ierr); 3581e0482f5SStefano Zampini ierr = ISLocalToGlobalMappingApply(el2g,cum,tbz,tbz);CHKERRQ(ierr); 3591e0482f5SStefano Zampini ierr = MatZeroRows(G,cum,tbz,0.,NULL,NULL);CHKERRQ(ierr); 3601e0482f5SStefano Zampini ierr = PetscFree(tbz);CHKERRQ(ierr); 3611e0482f5SStefano Zampini } 362213b8bfaSStefano Zampini } else { /* we need the entire G to infer the nullspace */ 363213b8bfaSStefano Zampini ierr = PetscObjectReference((PetscObject)pcbddc->discretegradient);CHKERRQ(ierr); 364213b8bfaSStefano Zampini G = pcbddc->discretegradient; 365213b8bfaSStefano Zampini } 366a13144ffSStefano Zampini 367a13144ffSStefano Zampini /* Extract subdomain relevant rows of G */ 368a13144ffSStefano Zampini ierr = ISLocalToGlobalMappingGetIndices(el2g,&idxs);CHKERRQ(ierr); 369a13144ffSStefano Zampini ierr = ISCreateGeneral(comm,ne,idxs,PETSC_USE_POINTER,&lned);CHKERRQ(ierr); 3707dae84e0SHong Zhang ierr = MatCreateSubMatrix(G,lned,NULL,MAT_INITIAL_MATRIX,&lGall);CHKERRQ(ierr); 371a13144ffSStefano Zampini ierr = ISLocalToGlobalMappingRestoreIndices(el2g,&idxs);CHKERRQ(ierr); 372a13144ffSStefano Zampini ierr = ISDestroy(&lned);CHKERRQ(ierr); 373a13144ffSStefano Zampini ierr = MatConvert(lGall,MATIS,MAT_INITIAL_MATRIX,&lGis);CHKERRQ(ierr); 374a13144ffSStefano Zampini ierr = MatDestroy(&lGall);CHKERRQ(ierr); 375a13144ffSStefano Zampini ierr = MatISGetLocalMat(lGis,&lG);CHKERRQ(ierr); 376a13144ffSStefano Zampini 377213b8bfaSStefano Zampini /* SF for nodal 
dofs communications */ 378c2151214SStefano Zampini ierr = MatGetLocalSize(G,NULL,&Lv);CHKERRQ(ierr); 379a13144ffSStefano Zampini ierr = MatGetLocalToGlobalMapping(lGis,NULL,&vl2g);CHKERRQ(ierr); 380a13144ffSStefano Zampini ierr = PetscObjectReference((PetscObject)vl2g);CHKERRQ(ierr); 381a13144ffSStefano Zampini ierr = ISLocalToGlobalMappingGetSize(vl2g,&nv);CHKERRQ(ierr); 382a13144ffSStefano Zampini ierr = PetscSFCreate(comm,&sfv);CHKERRQ(ierr); 383a13144ffSStefano Zampini ierr = ISLocalToGlobalMappingGetIndices(vl2g,&idxs);CHKERRQ(ierr); 384a13144ffSStefano Zampini ierr = PetscSFSetGraphLayout(sfv,lGis->cmap,nv,NULL,PETSC_OWN_POINTER,idxs);CHKERRQ(ierr); 385a13144ffSStefano Zampini ierr = ISLocalToGlobalMappingRestoreIndices(vl2g,&idxs);CHKERRQ(ierr); 386213b8bfaSStefano Zampini i = singular ? 2 : 1; 387213b8bfaSStefano Zampini ierr = PetscMalloc2(i*nv,&sfvleaves,i*Lv,&sfvroots);CHKERRQ(ierr); 388a13144ffSStefano Zampini 3891e0482f5SStefano Zampini /* Destroy temporary G created in MATIS format and modified G */ 390213b8bfaSStefano Zampini ierr = PetscObjectReference((PetscObject)lG);CHKERRQ(ierr); 391a13144ffSStefano Zampini ierr = MatDestroy(&lGis);CHKERRQ(ierr); 392213b8bfaSStefano Zampini ierr = MatDestroy(&G);CHKERRQ(ierr); 393a13144ffSStefano Zampini 394213b8bfaSStefano Zampini if (print) { 395213b8bfaSStefano Zampini ierr = PetscObjectSetName((PetscObject)lG,"initial_lG");CHKERRQ(ierr); 396213b8bfaSStefano Zampini ierr = MatView(lG,NULL);CHKERRQ(ierr); 397213b8bfaSStefano Zampini } 398213b8bfaSStefano Zampini 399213b8bfaSStefano Zampini /* Save lG for values insertion in change of basis */ 4000569b399SStefano Zampini ierr = MatDuplicate(lG,MAT_COPY_VALUES,&lGinit);CHKERRQ(ierr); 4010569b399SStefano Zampini 402a13144ffSStefano Zampini /* Analyze the edge-nodes connections (duplicate lG) */ 4034e64d54eSstefano_zampini ierr = MatDuplicate(lG,MAT_COPY_VALUES,&lGe);CHKERRQ(ierr); 4044e64d54eSstefano_zampini ierr = 
MatSetOption(lGe,MAT_KEEP_NONZERO_PATTERN,PETSC_FALSE);CHKERRQ(ierr); 405a13144ffSStefano Zampini ierr = PetscBTCreate(nv,&btv);CHKERRQ(ierr); 406a13144ffSStefano Zampini ierr = PetscBTCreate(ne,&bte);CHKERRQ(ierr); 407a13144ffSStefano Zampini ierr = PetscBTCreate(ne,&btb);CHKERRQ(ierr); 4087d871cd7SStefano Zampini ierr = PetscBTCreate(ne,&btbd);CHKERRQ(ierr); 409c2151214SStefano Zampini ierr = PetscBTCreate(nv,&btvcand);CHKERRQ(ierr); 410a13144ffSStefano Zampini /* need to import the boundary specification to ensure the 411a13144ffSStefano Zampini proper detection of coarse edges' endpoints */ 412a13144ffSStefano Zampini if (pcbddc->DirichletBoundariesLocal) { 413c2151214SStefano Zampini IS is; 414c2151214SStefano Zampini 415c2151214SStefano Zampini if (fl2g) { 416c2151214SStefano Zampini ierr = ISGlobalToLocalMappingApplyIS(fl2g,IS_GTOLM_MASK,pcbddc->DirichletBoundariesLocal,&is);CHKERRQ(ierr); 417c2151214SStefano Zampini } else { 418c2151214SStefano Zampini is = pcbddc->DirichletBoundariesLocal; 419c2151214SStefano Zampini } 420c2151214SStefano Zampini ierr = ISGetLocalSize(is,&cum);CHKERRQ(ierr); 421c2151214SStefano Zampini ierr = ISGetIndices(is,&idxs);CHKERRQ(ierr); 422a13144ffSStefano Zampini for (i=0;i<cum;i++) { 423a13144ffSStefano Zampini if (idxs[i] >= 0) { 424a13144ffSStefano Zampini ierr = PetscBTSet(btb,idxs[i]);CHKERRQ(ierr); 4257d871cd7SStefano Zampini ierr = PetscBTSet(btbd,idxs[i]);CHKERRQ(ierr); 426a13144ffSStefano Zampini } 427a13144ffSStefano Zampini } 428c2151214SStefano Zampini ierr = ISRestoreIndices(is,&idxs);CHKERRQ(ierr); 429c2151214SStefano Zampini if (fl2g) { 430c2151214SStefano Zampini ierr = ISDestroy(&is);CHKERRQ(ierr); 431c2151214SStefano Zampini } 432a13144ffSStefano Zampini } 433a13144ffSStefano Zampini if (pcbddc->NeumannBoundariesLocal) { 434c2151214SStefano Zampini IS is; 435c2151214SStefano Zampini 436c2151214SStefano Zampini if (fl2g) { 437c2151214SStefano Zampini ierr = 
ISGlobalToLocalMappingApplyIS(fl2g,IS_GTOLM_MASK,pcbddc->NeumannBoundariesLocal,&is);CHKERRQ(ierr); 438c2151214SStefano Zampini } else { 439c2151214SStefano Zampini is = pcbddc->NeumannBoundariesLocal; 440c2151214SStefano Zampini } 441c2151214SStefano Zampini ierr = ISGetLocalSize(is,&cum);CHKERRQ(ierr); 442c2151214SStefano Zampini ierr = ISGetIndices(is,&idxs);CHKERRQ(ierr); 443a13144ffSStefano Zampini for (i=0;i<cum;i++) { 444a13144ffSStefano Zampini if (idxs[i] >= 0) { 445a13144ffSStefano Zampini ierr = PetscBTSet(btb,idxs[i]);CHKERRQ(ierr); 446a13144ffSStefano Zampini } 447a13144ffSStefano Zampini } 448c2151214SStefano Zampini ierr = ISRestoreIndices(is,&idxs);CHKERRQ(ierr); 449c2151214SStefano Zampini if (fl2g) { 450c2151214SStefano Zampini ierr = ISDestroy(&is);CHKERRQ(ierr); 451a13144ffSStefano Zampini } 452c2151214SStefano Zampini } 453c2151214SStefano Zampini 454213b8bfaSStefano Zampini /* Count neighs per dof */ 455637e8532SStefano Zampini ierr = PetscCalloc1(ne,&ecount);CHKERRQ(ierr); 456637e8532SStefano Zampini ierr = PetscMalloc1(ne,&eneighs);CHKERRQ(ierr); 457637e8532SStefano Zampini ierr = ISLocalToGlobalMappingGetInfo(el2g,&n_neigh,&neigh,&n_shared,&shared);CHKERRQ(ierr); 458637e8532SStefano Zampini for (i=1,cum=0;i<n_neigh;i++) { 459637e8532SStefano Zampini cum += n_shared[i]; 460637e8532SStefano Zampini for (j=0;j<n_shared[i];j++) { 461637e8532SStefano Zampini ecount[shared[i][j]]++; 462637e8532SStefano Zampini } 463637e8532SStefano Zampini } 464637e8532SStefano Zampini if (ne) { 465637e8532SStefano Zampini ierr = PetscMalloc1(cum,&eneighs[0]);CHKERRQ(ierr); 466637e8532SStefano Zampini } 467637e8532SStefano Zampini for (i=1;i<ne;i++) eneighs[i] = eneighs[i-1] + ecount[i-1]; 468637e8532SStefano Zampini ierr = PetscMemzero(ecount,ne*sizeof(PetscInt));CHKERRQ(ierr); 469637e8532SStefano Zampini for (i=1;i<n_neigh;i++) { 470637e8532SStefano Zampini for (j=0;j<n_shared[i];j++) { 471637e8532SStefano Zampini PetscInt k = shared[i][j]; 472637e8532SStefano 
Zampini eneighs[k][ecount[k]] = neigh[i]; 473637e8532SStefano Zampini ecount[k]++; 474637e8532SStefano Zampini } 475637e8532SStefano Zampini } 476637e8532SStefano Zampini for (i=0;i<ne;i++) { 477637e8532SStefano Zampini ierr = PetscSortRemoveDupsInt(&ecount[i],eneighs[i]);CHKERRQ(ierr); 478637e8532SStefano Zampini } 479637e8532SStefano Zampini ierr = ISLocalToGlobalMappingRestoreInfo(el2g,&n_neigh,&neigh,&n_shared,&shared);CHKERRQ(ierr); 480637e8532SStefano Zampini ierr = PetscCalloc1(nv,&vcount);CHKERRQ(ierr); 481637e8532SStefano Zampini ierr = PetscMalloc1(nv,&vneighs);CHKERRQ(ierr); 482637e8532SStefano Zampini ierr = ISLocalToGlobalMappingGetInfo(vl2g,&n_neigh,&neigh,&n_shared,&shared);CHKERRQ(ierr); 483637e8532SStefano Zampini for (i=1,cum=0;i<n_neigh;i++) { 484637e8532SStefano Zampini cum += n_shared[i]; 485637e8532SStefano Zampini for (j=0;j<n_shared[i];j++) { 486637e8532SStefano Zampini vcount[shared[i][j]]++; 487637e8532SStefano Zampini } 488637e8532SStefano Zampini } 489637e8532SStefano Zampini if (nv) { 490637e8532SStefano Zampini ierr = PetscMalloc1(cum,&vneighs[0]);CHKERRQ(ierr); 491637e8532SStefano Zampini } 492637e8532SStefano Zampini for (i=1;i<nv;i++) vneighs[i] = vneighs[i-1] + vcount[i-1]; 493637e8532SStefano Zampini ierr = PetscMemzero(vcount,nv*sizeof(PetscInt));CHKERRQ(ierr); 494637e8532SStefano Zampini for (i=1;i<n_neigh;i++) { 495637e8532SStefano Zampini for (j=0;j<n_shared[i];j++) { 496637e8532SStefano Zampini PetscInt k = shared[i][j]; 497637e8532SStefano Zampini vneighs[k][vcount[k]] = neigh[i]; 498637e8532SStefano Zampini vcount[k]++; 499637e8532SStefano Zampini } 500637e8532SStefano Zampini } 501637e8532SStefano Zampini for (i=0;i<nv;i++) { 502637e8532SStefano Zampini ierr = PetscSortRemoveDupsInt(&vcount[i],vneighs[i]);CHKERRQ(ierr); 503637e8532SStefano Zampini } 504637e8532SStefano Zampini ierr = ISLocalToGlobalMappingRestoreInfo(vl2g,&n_neigh,&neigh,&n_shared,&shared);CHKERRQ(ierr); 505637e8532SStefano Zampini 5067d871cd7SStefano 
Zampini /* need to remove coarse faces' dofs and coarse edges' dirichlet dofs 5077d871cd7SStefano Zampini for proper detection of coarse edges' endpoints */ 50862b0c6f7SStefano Zampini ierr = PetscBTCreate(ne,&btee);CHKERRQ(ierr); 50962b0c6f7SStefano Zampini for (i=0;i<ne;i++) { 5107d871cd7SStefano Zampini if ((ecount[i] > 1 && !PetscBTLookup(btbd,i)) || (ecount[i] == 1 && PetscBTLookup(btb,i))) { 51162b0c6f7SStefano Zampini ierr = PetscBTSet(btee,i);CHKERRQ(ierr); 51262b0c6f7SStefano Zampini } 51362b0c6f7SStefano Zampini } 514637e8532SStefano Zampini ierr = PetscMalloc1(ne,&marks);CHKERRQ(ierr); 51562b0c6f7SStefano Zampini if (!conforming) { 51662b0c6f7SStefano Zampini ierr = MatTranspose(lGe,MAT_INITIAL_MATRIX,&lGt);CHKERRQ(ierr); 51762b0c6f7SStefano Zampini ierr = MatGetRowIJ(lGt,0,PETSC_FALSE,PETSC_FALSE,&i,&iit,&jjt,&done);CHKERRQ(ierr); 51862b0c6f7SStefano Zampini } 5194e64d54eSstefano_zampini ierr = MatGetRowIJ(lGe,0,PETSC_FALSE,PETSC_FALSE,&i,&ii,&jj,&done);CHKERRQ(ierr); 520dec27d64SStefano Zampini ierr = MatSeqAIJGetArray(lGe,&vals);CHKERRQ(ierr); 52162b0c6f7SStefano Zampini cum = 0; 522a13144ffSStefano Zampini for (i=0;i<ne;i++) { 523dec27d64SStefano Zampini /* eliminate rows corresponding to edge dofs belonging to coarse faces */ 52462b0c6f7SStefano Zampini if (!PetscBTLookup(btee,i)) { 525a13144ffSStefano Zampini marks[cum++] = i; 526dec27d64SStefano Zampini continue; 527dec27d64SStefano Zampini } 528dec27d64SStefano Zampini /* set badly connected edge dofs as primal */ 52962b0c6f7SStefano Zampini if (!conforming) { 53062b0c6f7SStefano Zampini if (ii[i+1]-ii[i] != order + 1) { /* every row of G on the coarse edge should list order+1 nodal dofs */ 531a13144ffSStefano Zampini marks[cum++] = i; 532a13144ffSStefano Zampini ierr = PetscBTSet(bte,i);CHKERRQ(ierr); 533a13144ffSStefano Zampini for (j=ii[i];j<ii[i+1];j++) { 534a13144ffSStefano Zampini ierr = PetscBTSet(btv,jj[j]);CHKERRQ(ierr); 535a13144ffSStefano Zampini } 53662b0c6f7SStefano Zampini } else { 
53762b0c6f7SStefano Zampini /* every edge dofs should be connected trough a certain number of nodal dofs 53862b0c6f7SStefano Zampini to other edge dofs belonging to coarse edges 53962b0c6f7SStefano Zampini - at most 2 endpoints 54062b0c6f7SStefano Zampini - order-1 interior nodal dofs 54162b0c6f7SStefano Zampini - no undefined nodal dofs (nconn < order) 54262b0c6f7SStefano Zampini */ 54362b0c6f7SStefano Zampini PetscInt ends = 0,ints = 0, undef = 0; 54462b0c6f7SStefano Zampini for (j=ii[i];j<ii[i+1];j++) { 54562b0c6f7SStefano Zampini PetscInt v = jj[j],k; 54662b0c6f7SStefano Zampini PetscInt nconn = iit[v+1]-iit[v]; 54762b0c6f7SStefano Zampini for (k=iit[v];k<iit[v+1];k++) if (!PetscBTLookup(btee,jjt[k])) nconn--; 54862b0c6f7SStefano Zampini if (nconn > order) ends++; 54962b0c6f7SStefano Zampini else if (nconn == order) ints++; 55062b0c6f7SStefano Zampini else undef++; 55162b0c6f7SStefano Zampini } 55262b0c6f7SStefano Zampini if (undef || ends > 2 || ints != order -1) { 55362b0c6f7SStefano Zampini marks[cum++] = i; 55462b0c6f7SStefano Zampini ierr = PetscBTSet(bte,i);CHKERRQ(ierr); 55562b0c6f7SStefano Zampini for (j=ii[i];j<ii[i+1];j++) { 55662b0c6f7SStefano Zampini ierr = PetscBTSet(btv,jj[j]);CHKERRQ(ierr); 55762b0c6f7SStefano Zampini } 55862b0c6f7SStefano Zampini } 55962b0c6f7SStefano Zampini } 560a13144ffSStefano Zampini } 561dec27d64SStefano Zampini /* We assume the order on the element edge is ii[i+1]-ii[i]-1 */ 562dec27d64SStefano Zampini if (!order && ii[i+1] != ii[i]) { 563dec27d64SStefano Zampini PetscScalar val = 1./(ii[i+1]-ii[i]-1); 564dec27d64SStefano Zampini for (j=ii[i];j<ii[i+1];j++) vals[j] = val; 565a13144ffSStefano Zampini } 566dec27d64SStefano Zampini } 56762b0c6f7SStefano Zampini ierr = PetscBTDestroy(&btee);CHKERRQ(ierr); 568dec27d64SStefano Zampini ierr = MatSeqAIJRestoreArray(lGe,&vals);CHKERRQ(ierr); 5694e64d54eSstefano_zampini ierr = MatRestoreRowIJ(lGe,0,PETSC_FALSE,PETSC_FALSE,&i,&ii,&jj,&done);CHKERRQ(ierr); 57062b0c6f7SStefano Zampini 
if (!conforming) { 57162b0c6f7SStefano Zampini ierr = MatRestoreRowIJ(lGt,0,PETSC_FALSE,PETSC_FALSE,&i,&iit,&jjt,&done);CHKERRQ(ierr); 57262b0c6f7SStefano Zampini ierr = MatDestroy(&lGt);CHKERRQ(ierr); 57362b0c6f7SStefano Zampini } 5744e64d54eSstefano_zampini ierr = MatZeroRows(lGe,cum,marks,0.,NULL,NULL);CHKERRQ(ierr); 575637e8532SStefano Zampini 576b03ebc13SStefano Zampini /* identify splitpoints and corner candidates */ 5774e64d54eSstefano_zampini ierr = MatTranspose(lGe,MAT_INITIAL_MATRIX,&lGt);CHKERRQ(ierr); 578a13144ffSStefano Zampini if (print) { 5794e64d54eSstefano_zampini ierr = PetscObjectSetName((PetscObject)lGe,"edgerestr_lG");CHKERRQ(ierr); 5804e64d54eSstefano_zampini ierr = MatView(lGe,NULL);CHKERRQ(ierr); 5814e64d54eSstefano_zampini ierr = PetscObjectSetName((PetscObject)lGt,"edgerestr_lGt");CHKERRQ(ierr); 582a13144ffSStefano Zampini ierr = MatView(lGt,NULL);CHKERRQ(ierr); 583a13144ffSStefano Zampini } 584a13144ffSStefano Zampini ierr = MatGetRowIJ(lGt,0,PETSC_FALSE,PETSC_FALSE,&i,&ii,&jj,&done);CHKERRQ(ierr); 585dec27d64SStefano Zampini ierr = MatSeqAIJGetArray(lGt,&vals);CHKERRQ(ierr); 586a13144ffSStefano Zampini for (i=0;i<nv;i++) { 587637e8532SStefano Zampini PetscInt ord = order, test = ii[i+1]-ii[i], vc = vcount[i]; 5887d871cd7SStefano Zampini PetscBool sneighs = PETSC_TRUE, bdir = PETSC_FALSE; 589b03ebc13SStefano Zampini if (!order) { /* variable order */ 590dec27d64SStefano Zampini PetscReal vorder = 0.; 591dec27d64SStefano Zampini 592dec27d64SStefano Zampini for (j=ii[i];j<ii[i+1];j++) vorder += PetscRealPart(vals[j]); 593dec27d64SStefano Zampini test = PetscFloorReal(vorder+10.*PETSC_SQRT_MACHINE_EPSILON); 594dec27d64SStefano Zampini if (vorder-test > PETSC_SQRT_MACHINE_EPSILON) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Unexpected value for vorder: %g (%d)",vorder,test); 595dec27d64SStefano Zampini ord = 1; 596dec27d64SStefano Zampini } 597a13144ffSStefano Zampini #if defined(PETSC_USE_DEBUG) 598dec27d64SStefano Zampini if (test%ord) 
SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Unexpected number of edge dofs %d connected with nodal dof %d with order %d",test,i,ord); 599a13144ffSStefano Zampini #endif 600637e8532SStefano Zampini for (j=ii[i];j<ii[i+1] && sneighs;j++) { 6017d871cd7SStefano Zampini if (PetscBTLookup(btbd,jj[j])) { 6027d871cd7SStefano Zampini bdir = PETSC_TRUE; 6037d871cd7SStefano Zampini break; 6047d871cd7SStefano Zampini } 605637e8532SStefano Zampini if (vc != ecount[jj[j]]) { 606637e8532SStefano Zampini sneighs = PETSC_FALSE; 607637e8532SStefano Zampini } else { 608637e8532SStefano Zampini PetscInt k,*vn = vneighs[i], *en = eneighs[jj[j]]; 609637e8532SStefano Zampini for (k=0;k<vc;k++) { 610637e8532SStefano Zampini if (vn[k] != en[k]) { 611637e8532SStefano Zampini sneighs = PETSC_FALSE; 612637e8532SStefano Zampini break; 613637e8532SStefano Zampini } 614637e8532SStefano Zampini } 615637e8532SStefano Zampini } 616637e8532SStefano Zampini } 6177d871cd7SStefano Zampini if (!sneighs || test >= 3*ord || bdir) { /* splitpoints */ 6187d871cd7SStefano Zampini if (print) PetscPrintf(PETSC_COMM_SELF,"SPLITPOINT %d (%d %d %d)\n",i,!sneighs,test >= 3*ord,bdir); 619a13144ffSStefano Zampini ierr = PetscBTSet(btv,i);CHKERRQ(ierr); 620dec27d64SStefano Zampini } else if (test == ord) { 621b03ebc13SStefano Zampini if (order == 1 || (!order && ii[i+1]-ii[i] == 1)) { 622a13144ffSStefano Zampini if (print) PetscPrintf(PETSC_COMM_SELF,"ENDPOINT %d\n",i); 623a13144ffSStefano Zampini ierr = PetscBTSet(btv,i);CHKERRQ(ierr); 624a13144ffSStefano Zampini } else { 625a13144ffSStefano Zampini if (print) PetscPrintf(PETSC_COMM_SELF,"CORNER CANDIDATE %d\n",i); 626a13144ffSStefano Zampini ierr = PetscBTSet(btvcand,i);CHKERRQ(ierr); 627a13144ffSStefano Zampini } 628a13144ffSStefano Zampini } 629a13144ffSStefano Zampini } 630637e8532SStefano Zampini ierr = PetscFree(ecount);CHKERRQ(ierr); 631637e8532SStefano Zampini ierr = PetscFree(vcount);CHKERRQ(ierr); 632637e8532SStefano Zampini if (ne) { 633637e8532SStefano 
Zampini ierr = PetscFree(eneighs[0]);CHKERRQ(ierr); 634637e8532SStefano Zampini } 635637e8532SStefano Zampini if (nv) { 636637e8532SStefano Zampini ierr = PetscFree(vneighs[0]);CHKERRQ(ierr); 637637e8532SStefano Zampini } 638637e8532SStefano Zampini ierr = PetscFree(eneighs);CHKERRQ(ierr); 639637e8532SStefano Zampini ierr = PetscFree(vneighs);CHKERRQ(ierr); 6407d871cd7SStefano Zampini ierr = PetscBTDestroy(&btbd);CHKERRQ(ierr); 641b03ebc13SStefano Zampini 642b03ebc13SStefano Zampini /* a candidate is valid if it is connected to another candidate via a non-primal edge dof */ 643b03ebc13SStefano Zampini if (order != 1) { 644b03ebc13SStefano Zampini if (print) PetscPrintf(PETSC_COMM_SELF,"INSPECTING CANDIDATES\n"); 645b03ebc13SStefano Zampini ierr = MatGetRowIJ(lGe,0,PETSC_FALSE,PETSC_FALSE,&i,&iit,&jjt,&done);CHKERRQ(ierr); 646b03ebc13SStefano Zampini for (i=0;i<nv;i++) { 647b03ebc13SStefano Zampini if (PetscBTLookup(btvcand,i)) { 648b03ebc13SStefano Zampini PetscBool found = PETSC_FALSE; 649b03ebc13SStefano Zampini for (j=ii[i];j<ii[i+1] && !found;j++) { 650b03ebc13SStefano Zampini PetscInt k,e = jj[j]; 651b03ebc13SStefano Zampini if (PetscBTLookup(bte,e)) continue; 652b03ebc13SStefano Zampini for (k=iit[e];k<iit[e+1];k++) { 653b03ebc13SStefano Zampini PetscInt v = jjt[k]; 654b03ebc13SStefano Zampini if (v != i && PetscBTLookup(btvcand,v)) { 655b03ebc13SStefano Zampini found = PETSC_TRUE; 656b03ebc13SStefano Zampini break; 657b03ebc13SStefano Zampini } 658b03ebc13SStefano Zampini } 659b03ebc13SStefano Zampini } 660b03ebc13SStefano Zampini if (!found) { 661b03ebc13SStefano Zampini if (print) PetscPrintf(PETSC_COMM_SELF," CANDIDATE %d CLEARED\n",i); 662b03ebc13SStefano Zampini ierr = PetscBTClear(btvcand,i);CHKERRQ(ierr); 663b03ebc13SStefano Zampini } else { 664b03ebc13SStefano Zampini if (print) PetscPrintf(PETSC_COMM_SELF," CANDIDATE %d ACCEPTED\n",i); 665b03ebc13SStefano Zampini } 666b03ebc13SStefano Zampini } 667b03ebc13SStefano Zampini } 668b03ebc13SStefano 
Zampini ierr = MatRestoreRowIJ(lGe,0,PETSC_FALSE,PETSC_FALSE,&i,&iit,&jjt,&done);CHKERRQ(ierr); 669b03ebc13SStefano Zampini } 670dec27d64SStefano Zampini ierr = MatSeqAIJRestoreArray(lGt,&vals);CHKERRQ(ierr); 671a13144ffSStefano Zampini ierr = MatRestoreRowIJ(lGt,0,PETSC_FALSE,PETSC_FALSE,&i,&ii,&jj,&done);CHKERRQ(ierr); 672b03ebc13SStefano Zampini ierr = MatDestroy(&lGe);CHKERRQ(ierr); 673a13144ffSStefano Zampini 674a13144ffSStefano Zampini /* Get the local G^T explicitly */ 6750569b399SStefano Zampini ierr = MatDestroy(&lGt);CHKERRQ(ierr); 676a13144ffSStefano Zampini ierr = MatTranspose(lG,MAT_INITIAL_MATRIX,&lGt);CHKERRQ(ierr); 6774e64d54eSstefano_zampini ierr = MatSetOption(lGt,MAT_KEEP_NONZERO_PATTERN,PETSC_FALSE);CHKERRQ(ierr); 678a13144ffSStefano Zampini 6794e64d54eSstefano_zampini /* Mark interior nodal dofs */ 680a13144ffSStefano Zampini ierr = ISLocalToGlobalMappingGetInfo(vl2g,&n_neigh,&neigh,&n_shared,&shared);CHKERRQ(ierr); 6814e64d54eSstefano_zampini ierr = PetscBTCreate(nv,&btvi);CHKERRQ(ierr); 682a13144ffSStefano Zampini for (i=1;i<n_neigh;i++) { 683a13144ffSStefano Zampini for (j=0;j<n_shared[i];j++) { 6844e64d54eSstefano_zampini ierr = PetscBTSet(btvi,shared[i][j]);CHKERRQ(ierr); 685a13144ffSStefano Zampini } 686a13144ffSStefano Zampini } 687a13144ffSStefano Zampini ierr = ISLocalToGlobalMappingRestoreInfo(vl2g,&n_neigh,&neigh,&n_shared,&shared);CHKERRQ(ierr); 688a13144ffSStefano Zampini 689a13144ffSStefano Zampini /* communicate corners and splitpoints */ 690a13144ffSStefano Zampini ierr = PetscMalloc1(nv,&vmarks);CHKERRQ(ierr); 691a13144ffSStefano Zampini ierr = PetscMemzero(sfvleaves,nv*sizeof(PetscInt));CHKERRQ(ierr); 692a13144ffSStefano Zampini ierr = PetscMemzero(sfvroots,Lv*sizeof(PetscInt));CHKERRQ(ierr); 693a13144ffSStefano Zampini for (i=0;i<nv;i++) if (PetscUnlikely(PetscBTLookup(btv,i))) sfvleaves[i] = 1; 694a13144ffSStefano Zampini 695a13144ffSStefano Zampini if (print) { 696a13144ffSStefano Zampini IS tbz; 697a13144ffSStefano Zampini 
698a13144ffSStefano Zampini cum = 0; 699a13144ffSStefano Zampini for (i=0;i<nv;i++) 700a13144ffSStefano Zampini if (sfvleaves[i]) 701a13144ffSStefano Zampini vmarks[cum++] = i; 702a13144ffSStefano Zampini 703a13144ffSStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,cum,vmarks,PETSC_COPY_VALUES,&tbz);CHKERRQ(ierr); 704a13144ffSStefano Zampini ierr = PetscObjectSetName((PetscObject)tbz,"corners_to_be_zeroed_local");CHKERRQ(ierr); 705a13144ffSStefano Zampini ierr = ISView(tbz,NULL);CHKERRQ(ierr); 706a13144ffSStefano Zampini ierr = ISDestroy(&tbz);CHKERRQ(ierr); 707a13144ffSStefano Zampini } 708a13144ffSStefano Zampini 709a13144ffSStefano Zampini ierr = PetscSFReduceBegin(sfv,MPIU_INT,sfvleaves,sfvroots,MPI_SUM);CHKERRQ(ierr); 710a13144ffSStefano Zampini ierr = PetscSFReduceEnd(sfv,MPIU_INT,sfvleaves,sfvroots,MPI_SUM);CHKERRQ(ierr); 711a13144ffSStefano Zampini ierr = PetscSFBcastBegin(sfv,MPIU_INT,sfvroots,sfvleaves);CHKERRQ(ierr); 712a13144ffSStefano Zampini ierr = PetscSFBcastEnd(sfv,MPIU_INT,sfvroots,sfvleaves);CHKERRQ(ierr); 713a13144ffSStefano Zampini 7144e64d54eSstefano_zampini /* Zero rows of lGt corresponding to identified corners 7154e64d54eSstefano_zampini and interior nodal dofs */ 716a13144ffSStefano Zampini cum = 0; 717a13144ffSStefano Zampini for (i=0;i<nv;i++) { 718a13144ffSStefano Zampini if (sfvleaves[i]) { 719a13144ffSStefano Zampini vmarks[cum++] = i; 720a13144ffSStefano Zampini ierr = PetscBTSet(btv,i);CHKERRQ(ierr); 721a13144ffSStefano Zampini } 7224e64d54eSstefano_zampini if (!PetscBTLookup(btvi,i)) vmarks[cum++] = i; 723a13144ffSStefano Zampini } 7244e64d54eSstefano_zampini ierr = PetscBTDestroy(&btvi);CHKERRQ(ierr); 725a13144ffSStefano Zampini if (print) { 726a13144ffSStefano Zampini IS tbz; 727a13144ffSStefano Zampini 728a13144ffSStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,cum,vmarks,PETSC_COPY_VALUES,&tbz);CHKERRQ(ierr); 7294e64d54eSstefano_zampini ierr = 
PetscObjectSetName((PetscObject)tbz,"corners_to_be_zeroed_with_interior");CHKERRQ(ierr); 730a13144ffSStefano Zampini ierr = ISView(tbz,NULL);CHKERRQ(ierr); 731a13144ffSStefano Zampini ierr = ISDestroy(&tbz);CHKERRQ(ierr); 732a13144ffSStefano Zampini } 733a13144ffSStefano Zampini ierr = MatZeroRows(lGt,cum,vmarks,0.,NULL,NULL);CHKERRQ(ierr); 734a13144ffSStefano Zampini ierr = PetscFree(vmarks);CHKERRQ(ierr); 735a13144ffSStefano Zampini ierr = PetscSFDestroy(&sfv);CHKERRQ(ierr); 736a13144ffSStefano Zampini ierr = PetscFree2(sfvleaves,sfvroots);CHKERRQ(ierr); 737a13144ffSStefano Zampini 738a13144ffSStefano Zampini /* Recompute G */ 739a13144ffSStefano Zampini ierr = MatDestroy(&lG);CHKERRQ(ierr); 740a13144ffSStefano Zampini ierr = MatTranspose(lGt,MAT_INITIAL_MATRIX,&lG);CHKERRQ(ierr); 741a13144ffSStefano Zampini if (print) { 742a13144ffSStefano Zampini ierr = PetscObjectSetName((PetscObject)lG,"used_lG");CHKERRQ(ierr); 743a13144ffSStefano Zampini ierr = MatView(lG,NULL);CHKERRQ(ierr); 744a13144ffSStefano Zampini ierr = PetscObjectSetName((PetscObject)lGt,"used_lGt");CHKERRQ(ierr); 745a13144ffSStefano Zampini ierr = MatView(lGt,NULL);CHKERRQ(ierr); 746a13144ffSStefano Zampini } 747a13144ffSStefano Zampini 748a13144ffSStefano Zampini /* Get primal dofs (if any) */ 749a13144ffSStefano Zampini cum = 0; 750a13144ffSStefano Zampini for (i=0;i<ne;i++) { 751a13144ffSStefano Zampini if (PetscUnlikely(PetscBTLookup(bte,i))) marks[cum++] = i; 752a13144ffSStefano Zampini } 753c2151214SStefano Zampini if (fl2g) { 754c2151214SStefano Zampini ierr = ISLocalToGlobalMappingApply(fl2g,cum,marks,marks);CHKERRQ(ierr); 755c2151214SStefano Zampini } 756a13144ffSStefano Zampini ierr = ISCreateGeneral(comm,cum,marks,PETSC_COPY_VALUES,&primals);CHKERRQ(ierr); 757a13144ffSStefano Zampini if (print) { 758a13144ffSStefano Zampini ierr = PetscObjectSetName((PetscObject)primals,"prescribed_primal_dofs");CHKERRQ(ierr); 759a13144ffSStefano Zampini ierr = ISView(primals,NULL);CHKERRQ(ierr); 
760a13144ffSStefano Zampini } 761a13144ffSStefano Zampini ierr = PetscBTDestroy(&bte);CHKERRQ(ierr); 762c2151214SStefano Zampini /* TODO: what if the user passed in some of them ? */ 763a13144ffSStefano Zampini ierr = PCBDDCSetPrimalVerticesLocalIS(pc,primals);CHKERRQ(ierr); 764a13144ffSStefano Zampini ierr = ISDestroy(&primals);CHKERRQ(ierr); 765a13144ffSStefano Zampini 766a13144ffSStefano Zampini /* Compute edge connectivity */ 767a13144ffSStefano Zampini ierr = PetscObjectSetOptionsPrefix((PetscObject)lG,"econn_");CHKERRQ(ierr); 768a13144ffSStefano Zampini ierr = MatMatMultSymbolic(lG,lGt,PETSC_DEFAULT,&conn);CHKERRQ(ierr); 769a13144ffSStefano Zampini ierr = MatGetRowIJ(conn,0,PETSC_FALSE,PETSC_FALSE,&i,&ii,&jj,&done);CHKERRQ(ierr); 770c2151214SStefano Zampini if (fl2g) { 771c2151214SStefano Zampini PetscBT btf; 772c2151214SStefano Zampini PetscInt *iia,*jja,*iiu,*jju; 773c2151214SStefano Zampini PetscBool rest = PETSC_FALSE,free = PETSC_FALSE; 774c2151214SStefano Zampini 775c2151214SStefano Zampini /* create CSR for all local dofs */ 776c2151214SStefano Zampini ierr = PetscMalloc1(n+1,&iia);CHKERRQ(ierr); 777c2151214SStefano Zampini if (pcbddc->mat_graph->nvtxs_csr) { /* the user has passed in a CSR graph */ 778c2151214SStefano Zampini if (pcbddc->mat_graph->nvtxs_csr != n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_USER,"Invalid size of CSR graph %d. 
Should be %d\n",pcbddc->mat_graph->nvtxs_csr,n); 779c2151214SStefano Zampini iiu = pcbddc->mat_graph->xadj; 780c2151214SStefano Zampini jju = pcbddc->mat_graph->adjncy; 781c2151214SStefano Zampini } else if (pcbddc->use_local_adj) { 782c2151214SStefano Zampini rest = PETSC_TRUE; 783c2151214SStefano Zampini ierr = MatGetRowIJ(matis->A,0,PETSC_TRUE,PETSC_FALSE,&i,(const PetscInt**)&iiu,(const PetscInt**)&jju,&done);CHKERRQ(ierr); 784c2151214SStefano Zampini } else { 785c2151214SStefano Zampini free = PETSC_TRUE; 786c2151214SStefano Zampini ierr = PetscMalloc2(n+1,&iiu,n,&jju);CHKERRQ(ierr); 787c2151214SStefano Zampini iiu[0] = 0; 788c2151214SStefano Zampini for (i=0;i<n;i++) { 789c2151214SStefano Zampini iiu[i+1] = i+1; 790c2151214SStefano Zampini jju[i] = -1; 791d904f53bSStefano Zampini } 792c2151214SStefano Zampini } 793c2151214SStefano Zampini 794c2151214SStefano Zampini /* import sizes of CSR */ 795c2151214SStefano Zampini iia[0] = 0; 796c2151214SStefano Zampini for (i=0;i<n;i++) iia[i+1] = iiu[i+1]-iiu[i]; 797c2151214SStefano Zampini 798c2151214SStefano Zampini /* overwrite entries corresponding to the Nedelec field */ 799c2151214SStefano Zampini ierr = PetscBTCreate(n,&btf);CHKERRQ(ierr); 800c2151214SStefano Zampini ierr = ISGetIndices(nedfieldlocal,&idxs);CHKERRQ(ierr); 801c2151214SStefano Zampini for (i=0;i<ne;i++) { 802c2151214SStefano Zampini ierr = PetscBTSet(btf,idxs[i]);CHKERRQ(ierr); 803c2151214SStefano Zampini iia[idxs[i]+1] = ii[i+1]-ii[i]; 804c2151214SStefano Zampini } 805c2151214SStefano Zampini 806c2151214SStefano Zampini /* iia in CSR */ 807c2151214SStefano Zampini for (i=0;i<n;i++) iia[i+1] += iia[i]; 808c2151214SStefano Zampini 809c2151214SStefano Zampini /* jja in CSR */ 810c2151214SStefano Zampini ierr = PetscMalloc1(iia[n],&jja);CHKERRQ(ierr); 811c2151214SStefano Zampini for (i=0;i<n;i++) 812c2151214SStefano Zampini if (!PetscBTLookup(btf,i)) 813c2151214SStefano Zampini for (j=0;j<iiu[i+1]-iiu[i];j++) 814c2151214SStefano Zampini jja[iia[i]+j] 
= jju[iiu[i]+j]; 815c2151214SStefano Zampini 816c2151214SStefano Zampini /* map edge dofs connectivity */ 8171e0482f5SStefano Zampini if (jj) { 818c2151214SStefano Zampini ierr = ISLocalToGlobalMappingApply(fl2g,ii[ne],jj,(PetscInt *)jj);CHKERRQ(ierr); 819c2151214SStefano Zampini for (i=0;i<ne;i++) { 820c2151214SStefano Zampini PetscInt e = idxs[i]; 821c2151214SStefano Zampini for (j=0;j<ii[i+1]-ii[i];j++) jja[iia[e]+j] = jj[ii[i]+j]; 822c2151214SStefano Zampini } 8231e0482f5SStefano Zampini } 824c2151214SStefano Zampini ierr = ISRestoreIndices(nedfieldlocal,&idxs);CHKERRQ(ierr); 825c2151214SStefano Zampini ierr = PCBDDCSetLocalAdjacencyGraph(pc,n,iia,jja,PETSC_OWN_POINTER);CHKERRQ(ierr); 826c2151214SStefano Zampini if (rest) { 827c2151214SStefano Zampini ierr = MatRestoreRowIJ(matis->A,0,PETSC_TRUE,PETSC_FALSE,&i,(const PetscInt**)&iiu,(const PetscInt**)&jju,&done);CHKERRQ(ierr); 828c2151214SStefano Zampini } 829c2151214SStefano Zampini if (free) { 830c2151214SStefano Zampini ierr = PetscFree2(iiu,jju);CHKERRQ(ierr); 831c2151214SStefano Zampini } 832c2151214SStefano Zampini ierr = PetscBTDestroy(&btf);CHKERRQ(ierr); 833c2151214SStefano Zampini } else { 834c2151214SStefano Zampini ierr = PCBDDCSetLocalAdjacencyGraph(pc,n,ii,jj,PETSC_USE_POINTER);CHKERRQ(ierr); 835c2151214SStefano Zampini } 836c2151214SStefano Zampini 837a13144ffSStefano Zampini /* Analyze interface for edge dofs */ 838a13144ffSStefano Zampini ierr = PCBDDCAnalyzeInterface(pc);CHKERRQ(ierr); 839213b8bfaSStefano Zampini pcbddc->mat_graph->twodim = PETSC_FALSE; 840a13144ffSStefano Zampini 841a13144ffSStefano Zampini /* Get coarse edges in the edge space */ 842c2151214SStefano Zampini ierr = PCBDDCGraphGetCandidatesIS(pcbddc->mat_graph,NULL,NULL,&nee,&alleedges,&allprimals);CHKERRQ(ierr); 843a13144ffSStefano Zampini ierr = MatRestoreRowIJ(conn,0,PETSC_FALSE,PETSC_FALSE,&i,&ii,&jj,&done);CHKERRQ(ierr); 844a13144ffSStefano Zampini 845c2151214SStefano Zampini if (fl2g) { 846c2151214SStefano Zampini ierr = 
ISGlobalToLocalMappingApplyIS(fl2g,IS_GTOLM_DROP,allprimals,&primals);CHKERRQ(ierr); 847c2151214SStefano Zampini ierr = PetscMalloc1(nee,&eedges);CHKERRQ(ierr); 848c2151214SStefano Zampini for (i=0;i<nee;i++) { 849c2151214SStefano Zampini ierr = ISGlobalToLocalMappingApplyIS(fl2g,IS_GTOLM_DROP,alleedges[i],&eedges[i]);CHKERRQ(ierr); 850c2151214SStefano Zampini } 851c2151214SStefano Zampini } else { 852c2151214SStefano Zampini eedges = alleedges; 853c2151214SStefano Zampini primals = allprimals; 854c2151214SStefano Zampini } 855c2151214SStefano Zampini 856a13144ffSStefano Zampini /* Mark fine edge dofs with their coarse edge id */ 857a13144ffSStefano Zampini ierr = PetscMemzero(marks,ne*sizeof(PetscInt));CHKERRQ(ierr); 858c2151214SStefano Zampini ierr = ISGetLocalSize(primals,&cum);CHKERRQ(ierr); 859c2151214SStefano Zampini ierr = ISGetIndices(primals,&idxs);CHKERRQ(ierr); 860c2151214SStefano Zampini for (i=0;i<cum;i++) marks[idxs[i]] = nee+1; 861c2151214SStefano Zampini ierr = ISRestoreIndices(primals,&idxs);CHKERRQ(ierr); 862c2151214SStefano Zampini if (print) { 863c2151214SStefano Zampini ierr = PetscObjectSetName((PetscObject)primals,"obtained_primal_dofs");CHKERRQ(ierr); 864c2151214SStefano Zampini ierr = ISView(primals,NULL);CHKERRQ(ierr); 865c2151214SStefano Zampini } 866c2151214SStefano Zampini 867c2151214SStefano Zampini maxsize = 0; 868a13144ffSStefano Zampini for (i=0;i<nee;i++) { 869a13144ffSStefano Zampini PetscInt size,mark = i+1; 870a13144ffSStefano Zampini 871a13144ffSStefano Zampini ierr = ISGetLocalSize(eedges[i],&size);CHKERRQ(ierr); 872a13144ffSStefano Zampini ierr = ISGetIndices(eedges[i],&idxs);CHKERRQ(ierr); 873a13144ffSStefano Zampini for (j=0;j<size;j++) marks[idxs[j]] = mark; 874a13144ffSStefano Zampini ierr = ISRestoreIndices(eedges[i],&idxs);CHKERRQ(ierr); 875a13144ffSStefano Zampini maxsize = PetscMax(maxsize,size); 876a13144ffSStefano Zampini } 877a13144ffSStefano Zampini 878a13144ffSStefano Zampini /* Find coarse edge endpoints */ 
879a13144ffSStefano Zampini ierr = MatGetRowIJ(lG,0,PETSC_FALSE,PETSC_FALSE,&i,&ii,&jj,&done);CHKERRQ(ierr); 880a13144ffSStefano Zampini ierr = MatGetRowIJ(lGt,0,PETSC_FALSE,PETSC_FALSE,&i,&iit,&jjt,&done);CHKERRQ(ierr); 881a13144ffSStefano Zampini for (i=0;i<nee;i++) { 882a13144ffSStefano Zampini PetscInt mark = i+1,size; 883a13144ffSStefano Zampini 884a13144ffSStefano Zampini ierr = ISGetLocalSize(eedges[i],&size);CHKERRQ(ierr); 8851e0482f5SStefano Zampini if (!size && nedfieldlocal) continue; 8861e0482f5SStefano Zampini if (!size) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Unexpected zero sized edge %d",i); 887a13144ffSStefano Zampini ierr = ISGetIndices(eedges[i],&idxs);CHKERRQ(ierr); 888a13144ffSStefano Zampini if (print) { 889a13144ffSStefano Zampini PetscPrintf(PETSC_COMM_SELF,"ENDPOINTS ANALYSIS EDGE %d\n",i); 890a13144ffSStefano Zampini ISView(eedges[i],NULL); 891a13144ffSStefano Zampini } 892a13144ffSStefano Zampini for (j=0;j<size;j++) { 893a13144ffSStefano Zampini PetscInt k, ee = idxs[j]; 894a13144ffSStefano Zampini if (print) PetscPrintf(PETSC_COMM_SELF," idx %d\n",ee); 895a13144ffSStefano Zampini for (k=ii[ee];k<ii[ee+1];k++) { 896a13144ffSStefano Zampini if (print) PetscPrintf(PETSC_COMM_SELF," inspect %d\n",jj[k]); 897a13144ffSStefano Zampini if (PetscBTLookup(btv,jj[k])) { 898a13144ffSStefano Zampini if (print) PetscPrintf(PETSC_COMM_SELF," corner found (already set) %d\n",jj[k]); 899a13144ffSStefano Zampini } else if (PetscBTLookup(btvcand,jj[k])) { /* is it ok? 
*/ 900a13144ffSStefano Zampini PetscInt k2; 901a13144ffSStefano Zampini PetscBool corner = PETSC_FALSE; 902a13144ffSStefano Zampini for (k2 = iit[jj[k]];k2 < iit[jj[k]+1];k2++) { 903c2151214SStefano Zampini if (print) PetscPrintf(PETSC_COMM_SELF," INSPECTING %d: mark %d (ref mark %d), boundary %d\n",jjt[k2],marks[jjt[k2]],mark,!!PetscBTLookup(btb,jjt[k2])); 904c2151214SStefano Zampini /* it's a corner if either is connected with an edge dof belonging to a different cc or 905c2151214SStefano Zampini if the edge dof lie on the natural part of the boundary */ 906c2151214SStefano Zampini if ((marks[jjt[k2]] && marks[jjt[k2]] != mark) || (!marks[jjt[k2]] && PetscBTLookup(btb,jjt[k2]))) { 907a13144ffSStefano Zampini corner = PETSC_TRUE; 908a13144ffSStefano Zampini break; 909a13144ffSStefano Zampini } 910a13144ffSStefano Zampini } 911a13144ffSStefano Zampini if (corner) { /* found the nodal dof corresponding to the endpoint of the edge */ 912a13144ffSStefano Zampini if (print) PetscPrintf(PETSC_COMM_SELF," corner found %d\n",jj[k]); 913a13144ffSStefano Zampini ierr = PetscBTSet(btv,jj[k]);CHKERRQ(ierr); 914a13144ffSStefano Zampini } else { 915a13144ffSStefano Zampini if (print) PetscPrintf(PETSC_COMM_SELF," no corners found\n"); 916a13144ffSStefano Zampini } 917a13144ffSStefano Zampini } 918a13144ffSStefano Zampini } 919a13144ffSStefano Zampini } 920a13144ffSStefano Zampini ierr = ISRestoreIndices(eedges[i],&idxs);CHKERRQ(ierr); 921a13144ffSStefano Zampini } 922a13144ffSStefano Zampini ierr = MatRestoreRowIJ(lGt,0,PETSC_FALSE,PETSC_FALSE,&i,&iit,&jjt,&done);CHKERRQ(ierr); 923a13144ffSStefano Zampini ierr = MatRestoreRowIJ(lG,0,PETSC_FALSE,PETSC_FALSE,&i,&ii,&jj,&done);CHKERRQ(ierr); 924c2151214SStefano Zampini ierr = PetscBTDestroy(&btb);CHKERRQ(ierr); 925a13144ffSStefano Zampini 926a13144ffSStefano Zampini /* Reset marked primal dofs */ 927a13144ffSStefano Zampini ierr = ISGetLocalSize(primals,&cum);CHKERRQ(ierr); 928a13144ffSStefano Zampini ierr = 
ISGetIndices(primals,&idxs);CHKERRQ(ierr); 929a13144ffSStefano Zampini for (i=0;i<cum;i++) marks[idxs[i]] = 0; 930a13144ffSStefano Zampini ierr = ISRestoreIndices(primals,&idxs);CHKERRQ(ierr); 931a13144ffSStefano Zampini 9320569b399SStefano Zampini /* Now use the initial lG */ 9330569b399SStefano Zampini ierr = MatDestroy(&lG);CHKERRQ(ierr); 9340569b399SStefano Zampini ierr = MatDestroy(&lGt);CHKERRQ(ierr); 9350569b399SStefano Zampini lG = lGinit; 9360569b399SStefano Zampini ierr = MatTranspose(lG,MAT_INITIAL_MATRIX,&lGt);CHKERRQ(ierr); 9370569b399SStefano Zampini 938a13144ffSStefano Zampini /* Compute extended cols indices */ 939b03ebc13SStefano Zampini ierr = PetscBTCreate(nv,&btvc);CHKERRQ(ierr); 940b03ebc13SStefano Zampini ierr = PetscBTCreate(nee,&bter);CHKERRQ(ierr); 941a13144ffSStefano Zampini ierr = MatGetRowIJ(lG,0,PETSC_FALSE,PETSC_FALSE,&i,&ii,&jj,&done);CHKERRQ(ierr); 942a13144ffSStefano Zampini ierr = MatSeqAIJGetMaxRowNonzeros(lG,&i);CHKERRQ(ierr); 943a13144ffSStefano Zampini i *= maxsize; 944b03ebc13SStefano Zampini ierr = PetscCalloc1(nee,&extcols);CHKERRQ(ierr); 945a13144ffSStefano Zampini ierr = PetscMalloc2(i,&extrow,i,&gidxs);CHKERRQ(ierr); 946a13144ffSStefano Zampini eerr = PETSC_FALSE; 947a13144ffSStefano Zampini for (i=0;i<nee;i++) { 948b03ebc13SStefano Zampini PetscInt size,found = 0; 949a13144ffSStefano Zampini 950a13144ffSStefano Zampini cum = 0; 951a13144ffSStefano Zampini ierr = ISGetLocalSize(eedges[i],&size);CHKERRQ(ierr); 9521e0482f5SStefano Zampini if (!size && nedfieldlocal) continue; 9531e0482f5SStefano Zampini if (!size) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Unexpected zero sized edge %d",i); 954a13144ffSStefano Zampini ierr = ISGetIndices(eedges[i],&idxs);CHKERRQ(ierr); 955b03ebc13SStefano Zampini ierr = PetscBTMemzero(nv,btvc);CHKERRQ(ierr); 956a13144ffSStefano Zampini for (j=0;j<size;j++) { 957a13144ffSStefano Zampini PetscInt k,ee = idxs[j]; 958b03ebc13SStefano Zampini for (k=ii[ee];k<ii[ee+1];k++) { 959b03ebc13SStefano 
Zampini PetscInt vv = jj[k]; 960b03ebc13SStefano Zampini if (!PetscBTLookup(btv,vv)) extrow[cum++] = vv; 961b03ebc13SStefano Zampini else if (!PetscBTLookupSet(btvc,vv)) found++; 962b03ebc13SStefano Zampini } 963a13144ffSStefano Zampini } 964a13144ffSStefano Zampini ierr = ISRestoreIndices(eedges[i],&idxs);CHKERRQ(ierr); 965a13144ffSStefano Zampini ierr = PetscSortRemoveDupsInt(&cum,extrow);CHKERRQ(ierr); 966a13144ffSStefano Zampini ierr = ISLocalToGlobalMappingApply(vl2g,cum,extrow,gidxs);CHKERRQ(ierr); 967a13144ffSStefano Zampini ierr = PetscSortIntWithArray(cum,gidxs,extrow);CHKERRQ(ierr); 968a13144ffSStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,cum,extrow,PETSC_COPY_VALUES,&extcols[i]);CHKERRQ(ierr); 969a13144ffSStefano Zampini /* it may happen that endpoints are not defined at this point 970a13144ffSStefano Zampini if it is the case, mark this edge for a second pass */ 971b03ebc13SStefano Zampini if (cum != size -1 || found != 2) { 972b03ebc13SStefano Zampini ierr = PetscBTSet(bter,i);CHKERRQ(ierr); 973a13144ffSStefano Zampini if (print) { 974a13144ffSStefano Zampini ierr = PetscObjectSetName((PetscObject)eedges[i],"error_edge");CHKERRQ(ierr); 975a13144ffSStefano Zampini ierr = ISView(eedges[i],NULL);CHKERRQ(ierr); 976a13144ffSStefano Zampini ierr = PetscObjectSetName((PetscObject)extcols[i],"error_extcol");CHKERRQ(ierr); 977a13144ffSStefano Zampini ierr = ISView(extcols[i],NULL);CHKERRQ(ierr); 978a13144ffSStefano Zampini } 979a13144ffSStefano Zampini eerr = PETSC_TRUE; 980a13144ffSStefano Zampini } 981a13144ffSStefano Zampini } 9824e64d54eSstefano_zampini /* if (eerr) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Unexpected SIZE OF EDGE > EXTCOL FIRST PASS"); */ 983a13144ffSStefano Zampini ierr = MPIU_Allreduce(&eerr,&done,1,MPIU_BOOL,MPI_LOR,comm);CHKERRQ(ierr); 984a13144ffSStefano Zampini if (done) { 985a13144ffSStefano Zampini PetscInt *newprimals; 986a13144ffSStefano Zampini 987a13144ffSStefano Zampini ierr = 
PetscMalloc1(ne,&newprimals);CHKERRQ(ierr); 988a13144ffSStefano Zampini ierr = ISGetLocalSize(primals,&cum);CHKERRQ(ierr); 989a13144ffSStefano Zampini ierr = ISGetIndices(primals,&idxs);CHKERRQ(ierr); 990a13144ffSStefano Zampini ierr = PetscMemcpy(newprimals,idxs,cum*sizeof(PetscInt));CHKERRQ(ierr); 991a13144ffSStefano Zampini ierr = ISRestoreIndices(primals,&idxs);CHKERRQ(ierr); 9920569b399SStefano Zampini ierr = MatGetRowIJ(lGt,0,PETSC_FALSE,PETSC_FALSE,&i,&iit,&jjt,&done);CHKERRQ(ierr); 993b03ebc13SStefano Zampini if (print) PetscPrintf(PETSC_COMM_SELF,"DOING SECOND PASS (eerr %d)\n",eerr); 994a13144ffSStefano Zampini for (i=0;i<nee;i++) { 995b03ebc13SStefano Zampini PetscBool has_candidates = PETSC_FALSE; 996b03ebc13SStefano Zampini if (PetscBTLookup(bter,i)) { 997a13144ffSStefano Zampini PetscInt size,mark = i+1; 998a13144ffSStefano Zampini 999a13144ffSStefano Zampini ierr = ISGetLocalSize(eedges[i],&size);CHKERRQ(ierr); 1000a13144ffSStefano Zampini ierr = ISGetIndices(eedges[i],&idxs);CHKERRQ(ierr); 1001c2151214SStefano Zampini /* for (j=0;j<size;j++) newprimals[cum++] = idxs[j]; */ 1002a13144ffSStefano Zampini for (j=0;j<size;j++) { 1003a13144ffSStefano Zampini PetscInt k,ee = idxs[j]; 1004b03ebc13SStefano Zampini if (print) PetscPrintf(PETSC_COMM_SELF,"Inspecting edge dof %d [%d %d)\n",ee,ii[ee],ii[ee+1]); 1005a13144ffSStefano Zampini for (k=ii[ee];k<ii[ee+1];k++) { 1006a13144ffSStefano Zampini /* set all candidates located on the edge as corners */ 1007a13144ffSStefano Zampini if (PetscBTLookup(btvcand,jj[k])) { 1008a13144ffSStefano Zampini PetscInt k2,vv = jj[k]; 1009b03ebc13SStefano Zampini has_candidates = PETSC_TRUE; 1010b03ebc13SStefano Zampini if (print) PetscPrintf(PETSC_COMM_SELF," Candidate set to vertex %d\n",vv); 1011a13144ffSStefano Zampini ierr = PetscBTSet(btv,vv);CHKERRQ(ierr); 1012a13144ffSStefano Zampini /* set all edge dofs connected to candidate as primals */ 1013a13144ffSStefano Zampini for (k2=iit[vv];k2<iit[vv+1];k2++) { 
1014a13144ffSStefano Zampini if (marks[jjt[k2]] == mark) { 1015a13144ffSStefano Zampini PetscInt k3,ee2 = jjt[k2]; 1016b03ebc13SStefano Zampini if (print) PetscPrintf(PETSC_COMM_SELF," Connected edge dof set to primal %d\n",ee2); 1017a13144ffSStefano Zampini newprimals[cum++] = ee2; 1018a13144ffSStefano Zampini /* finally set the new corners */ 1019a13144ffSStefano Zampini for (k3=ii[ee2];k3<ii[ee2+1];k3++) { 1020b03ebc13SStefano Zampini if (print) PetscPrintf(PETSC_COMM_SELF," Connected nodal dof set to vertex %d\n",jj[k3]); 1021a13144ffSStefano Zampini ierr = PetscBTSet(btv,jj[k3]);CHKERRQ(ierr); 1022a13144ffSStefano Zampini } 1023a13144ffSStefano Zampini } 1024a13144ffSStefano Zampini } 1025b03ebc13SStefano Zampini } else { 1026b03ebc13SStefano Zampini if (print) PetscPrintf(PETSC_COMM_SELF," Not a candidate vertex %d\n",jj[k]); 1027a13144ffSStefano Zampini } 1028a13144ffSStefano Zampini } 1029a13144ffSStefano Zampini } 1030b03ebc13SStefano Zampini if (!has_candidates) { /* circular edge */ 1031b03ebc13SStefano Zampini PetscInt k, ee = idxs[0],*tmarks; 1032b03ebc13SStefano Zampini 1033b03ebc13SStefano Zampini ierr = PetscCalloc1(ne,&tmarks);CHKERRQ(ierr); 1034b03ebc13SStefano Zampini if (print) PetscPrintf(PETSC_COMM_SELF," Circular edge %d\n",i); 1035b03ebc13SStefano Zampini for (k=ii[ee];k<ii[ee+1];k++) { 1036b03ebc13SStefano Zampini PetscInt k2; 1037b03ebc13SStefano Zampini if (print) PetscPrintf(PETSC_COMM_SELF," Set to corner %d\n",jj[k]); 1038b03ebc13SStefano Zampini ierr = PetscBTSet(btv,jj[k]);CHKERRQ(ierr); 1039b03ebc13SStefano Zampini for (k2=iit[jj[k]];k2<iit[jj[k]+1];k2++) tmarks[jjt[k2]]++; 1040b03ebc13SStefano Zampini } 1041b03ebc13SStefano Zampini for (j=0;j<size;j++) { 1042b03ebc13SStefano Zampini if (tmarks[idxs[j]] > 1) { 1043b03ebc13SStefano Zampini if (print) PetscPrintf(PETSC_COMM_SELF," Edge dof set to primal %d\n",idxs[j]); 1044b03ebc13SStefano Zampini newprimals[cum++] = idxs[j]; 1045b03ebc13SStefano Zampini } 1046b03ebc13SStefano Zampini 
} 1047b03ebc13SStefano Zampini ierr = PetscFree(tmarks);CHKERRQ(ierr); 1048b03ebc13SStefano Zampini } 1049a13144ffSStefano Zampini ierr = ISRestoreIndices(eedges[i],&idxs);CHKERRQ(ierr); 1050a13144ffSStefano Zampini } 1051a13144ffSStefano Zampini ierr = ISDestroy(&extcols[i]);CHKERRQ(ierr); 1052a13144ffSStefano Zampini } 1053b03ebc13SStefano Zampini ierr = PetscFree(extcols);CHKERRQ(ierr); 10540569b399SStefano Zampini ierr = MatRestoreRowIJ(lGt,0,PETSC_FALSE,PETSC_FALSE,&i,&iit,&jjt,&done);CHKERRQ(ierr); 1055a13144ffSStefano Zampini ierr = PetscSortRemoveDupsInt(&cum,newprimals);CHKERRQ(ierr); 1056c2151214SStefano Zampini if (fl2g) { 1057c2151214SStefano Zampini ierr = ISLocalToGlobalMappingApply(fl2g,cum,newprimals,newprimals);CHKERRQ(ierr); 1058c2151214SStefano Zampini ierr = ISDestroy(&primals);CHKERRQ(ierr); 1059c2151214SStefano Zampini for (i=0;i<nee;i++) { 1060c2151214SStefano Zampini ierr = ISDestroy(&eedges[i]);CHKERRQ(ierr); 1061c2151214SStefano Zampini } 1062c2151214SStefano Zampini ierr = PetscFree(eedges);CHKERRQ(ierr); 1063c2151214SStefano Zampini } 1064c2151214SStefano Zampini ierr = PCBDDCGraphRestoreCandidatesIS(pcbddc->mat_graph,NULL,NULL,&nee,&alleedges,&allprimals);CHKERRQ(ierr); 1065a13144ffSStefano Zampini ierr = ISCreateGeneral(comm,cum,newprimals,PETSC_COPY_VALUES,&primals);CHKERRQ(ierr); 1066a13144ffSStefano Zampini ierr = PetscFree(newprimals);CHKERRQ(ierr); 1067a13144ffSStefano Zampini ierr = PCBDDCSetPrimalVerticesLocalIS(pc,primals);CHKERRQ(ierr); 1068a13144ffSStefano Zampini ierr = ISDestroy(&primals);CHKERRQ(ierr); 1069a13144ffSStefano Zampini ierr = PCBDDCAnalyzeInterface(pc);CHKERRQ(ierr); 1070213b8bfaSStefano Zampini pcbddc->mat_graph->twodim = PETSC_FALSE; 1071c2151214SStefano Zampini ierr = PCBDDCGraphGetCandidatesIS(pcbddc->mat_graph,NULL,NULL,&nee,&alleedges,&allprimals);CHKERRQ(ierr); 1072c2151214SStefano Zampini if (fl2g) { 1073c2151214SStefano Zampini ierr = 
ISGlobalToLocalMappingApplyIS(fl2g,IS_GTOLM_DROP,allprimals,&primals);CHKERRQ(ierr); 1074c2151214SStefano Zampini ierr = PetscMalloc1(nee,&eedges);CHKERRQ(ierr); 1075c2151214SStefano Zampini for (i=0;i<nee;i++) { 1076c2151214SStefano Zampini ierr = ISGlobalToLocalMappingApplyIS(fl2g,IS_GTOLM_DROP,alleedges[i],&eedges[i]);CHKERRQ(ierr); 1077c2151214SStefano Zampini } 1078c2151214SStefano Zampini } else { 1079c2151214SStefano Zampini eedges = alleedges; 1080c2151214SStefano Zampini primals = allprimals; 1081c2151214SStefano Zampini } 1082b03ebc13SStefano Zampini ierr = PetscCalloc1(nee,&extcols);CHKERRQ(ierr); 1083a13144ffSStefano Zampini 1084a13144ffSStefano Zampini /* Mark again */ 1085a13144ffSStefano Zampini ierr = PetscMemzero(marks,ne*sizeof(PetscInt));CHKERRQ(ierr); 1086a13144ffSStefano Zampini for (i=0;i<nee;i++) { 1087a13144ffSStefano Zampini PetscInt size,mark = i+1; 1088a13144ffSStefano Zampini 1089a13144ffSStefano Zampini ierr = ISGetLocalSize(eedges[i],&size);CHKERRQ(ierr); 1090a13144ffSStefano Zampini ierr = ISGetIndices(eedges[i],&idxs);CHKERRQ(ierr); 1091a13144ffSStefano Zampini for (j=0;j<size;j++) marks[idxs[j]] = mark; 1092a13144ffSStefano Zampini ierr = ISRestoreIndices(eedges[i],&idxs);CHKERRQ(ierr); 1093a13144ffSStefano Zampini } 1094a13144ffSStefano Zampini if (print) { 1095a13144ffSStefano Zampini ierr = PetscObjectSetName((PetscObject)primals,"obtained_primal_dofs_secondpass");CHKERRQ(ierr); 1096a13144ffSStefano Zampini ierr = ISView(primals,NULL);CHKERRQ(ierr); 1097a13144ffSStefano Zampini } 1098a13144ffSStefano Zampini 1099a13144ffSStefano Zampini /* Recompute extended cols */ 1100a13144ffSStefano Zampini eerr = PETSC_FALSE; 1101a13144ffSStefano Zampini for (i=0;i<nee;i++) { 1102a13144ffSStefano Zampini PetscInt size; 1103a13144ffSStefano Zampini 1104a13144ffSStefano Zampini cum = 0; 1105a13144ffSStefano Zampini ierr = ISGetLocalSize(eedges[i],&size);CHKERRQ(ierr); 11061e0482f5SStefano Zampini if (!size && nedfieldlocal) continue; 
11071e0482f5SStefano Zampini if (!size) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Unexpected zero sized edge %d",i); 1108a13144ffSStefano Zampini ierr = ISGetIndices(eedges[i],&idxs);CHKERRQ(ierr); 1109a13144ffSStefano Zampini for (j=0;j<size;j++) { 1110a13144ffSStefano Zampini PetscInt k,ee = idxs[j]; 11111e0482f5SStefano Zampini for (k=ii[ee];k<ii[ee+1];k++) if (!PetscBTLookup(btv,jj[k])) extrow[cum++] = jj[k]; 1112a13144ffSStefano Zampini } 1113a13144ffSStefano Zampini ierr = ISRestoreIndices(eedges[i],&idxs);CHKERRQ(ierr); 1114a13144ffSStefano Zampini ierr = PetscSortRemoveDupsInt(&cum,extrow);CHKERRQ(ierr); 1115a13144ffSStefano Zampini ierr = ISLocalToGlobalMappingApply(vl2g,cum,extrow,gidxs);CHKERRQ(ierr); 1116a13144ffSStefano Zampini ierr = PetscSortIntWithArray(cum,gidxs,extrow);CHKERRQ(ierr); 1117a13144ffSStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,cum,extrow,PETSC_COPY_VALUES,&extcols[i]);CHKERRQ(ierr); 1118a13144ffSStefano Zampini if (cum != size -1) { 1119a13144ffSStefano Zampini if (print) { 1120a13144ffSStefano Zampini ierr = PetscObjectSetName((PetscObject)eedges[i],"error_edge_secondpass");CHKERRQ(ierr); 1121a13144ffSStefano Zampini ierr = ISView(eedges[i],NULL);CHKERRQ(ierr); 1122a13144ffSStefano Zampini ierr = PetscObjectSetName((PetscObject)extcols[i],"error_extcol_secondpass");CHKERRQ(ierr); 1123a13144ffSStefano Zampini ierr = ISView(extcols[i],NULL);CHKERRQ(ierr); 1124a13144ffSStefano Zampini } 1125a13144ffSStefano Zampini eerr = PETSC_TRUE; 1126a13144ffSStefano Zampini } 1127a13144ffSStefano Zampini } 1128a13144ffSStefano Zampini } 1129a13144ffSStefano Zampini ierr = MatRestoreRowIJ(lG,0,PETSC_FALSE,PETSC_FALSE,&i,&ii,&jj,&done);CHKERRQ(ierr); 1130a13144ffSStefano Zampini ierr = PetscFree2(extrow,gidxs);CHKERRQ(ierr); 1131b03ebc13SStefano Zampini ierr = PetscBTDestroy(&bter);CHKERRQ(ierr); 11327d871cd7SStefano Zampini if (print) { ierr = PCBDDCGraphASCIIView(pcbddc->mat_graph,5,PETSC_VIEWER_STDOUT_SELF);CHKERRQ(ierr); } 
1133a13144ffSStefano Zampini /* an error should not occur at this point */ 1134a13144ffSStefano Zampini if (eerr) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Unexpected SIZE OF EDGE > EXTCOL SECOND PASS"); 1135a13144ffSStefano Zampini 11364e64d54eSstefano_zampini /* Check the number of endpoints */ 11370569b399SStefano Zampini ierr = MatGetRowIJ(lG,0,PETSC_FALSE,PETSC_FALSE,&i,&ii,&jj,&done);CHKERRQ(ierr); 1138b03ebc13SStefano Zampini ierr = PetscMalloc1(2*nee,&corners);CHKERRQ(ierr); 1139b03ebc13SStefano Zampini ierr = PetscMalloc1(nee,&cedges);CHKERRQ(ierr); 11404e64d54eSstefano_zampini for (i=0;i<nee;i++) { 1141b03ebc13SStefano Zampini PetscInt size, found = 0, gc[2]; 11424e64d54eSstefano_zampini 1143b03ebc13SStefano Zampini /* init with defaults */ 1144b03ebc13SStefano Zampini cedges[i] = corners[i*2] = corners[i*2+1] = -1; 11454e64d54eSstefano_zampini ierr = ISGetLocalSize(eedges[i],&size);CHKERRQ(ierr); 11461e0482f5SStefano Zampini if (!size && nedfieldlocal) continue; 11471e0482f5SStefano Zampini if (!size) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Unexpected zero sized edge %d",i); 11484e64d54eSstefano_zampini ierr = ISGetIndices(eedges[i],&idxs);CHKERRQ(ierr); 1149b03ebc13SStefano Zampini ierr = PetscBTMemzero(nv,btvc);CHKERRQ(ierr); 11504e64d54eSstefano_zampini for (j=0;j<size;j++) { 11514e64d54eSstefano_zampini PetscInt k,ee = idxs[j]; 11524e64d54eSstefano_zampini for (k=ii[ee];k<ii[ee+1];k++) { 11534e64d54eSstefano_zampini PetscInt vv = jj[k]; 11544e64d54eSstefano_zampini if (PetscBTLookup(btv,vv) && !PetscBTLookupSet(btvc,vv)) { 1155b03ebc13SStefano Zampini if (found == 2) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Found more then two corners for edge %d\n",i); 1156b03ebc13SStefano Zampini corners[i*2+found++] = vv; 11574e64d54eSstefano_zampini } 11584e64d54eSstefano_zampini } 11594e64d54eSstefano_zampini } 1160b03ebc13SStefano Zampini if (found != 2) { 1161b03ebc13SStefano Zampini PetscInt e; 1162b03ebc13SStefano Zampini if (fl2g) { 1163b03ebc13SStefano 
Zampini ierr = ISLocalToGlobalMappingApply(fl2g,1,idxs,&e);CHKERRQ(ierr); 1164b03ebc13SStefano Zampini } else { 1165b03ebc13SStefano Zampini e = idxs[0]; 1166b03ebc13SStefano Zampini } 1167b03ebc13SStefano Zampini SETERRQ4(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Found %d corners for edge %d (astart %d, estart %d)\n",found,i,e,idxs[0]); 1168b03ebc13SStefano Zampini } 1169eee23b56SStefano Zampini 1170eee23b56SStefano Zampini /* get primal dof index on this coarse edge */ 1171b03ebc13SStefano Zampini ierr = ISLocalToGlobalMappingApply(vl2g,2,corners+2*i,gc);CHKERRQ(ierr); 1172b03ebc13SStefano Zampini if (gc[0] > gc[1]) { 1173b03ebc13SStefano Zampini PetscInt swap = corners[2*i]; 1174b03ebc13SStefano Zampini corners[2*i] = corners[2*i+1]; 1175b03ebc13SStefano Zampini corners[2*i+1] = swap; 1176b03ebc13SStefano Zampini } 1177eee23b56SStefano Zampini cedges[i] = idxs[size-1]; 11784e64d54eSstefano_zampini ierr = ISRestoreIndices(eedges[i],&idxs);CHKERRQ(ierr); 1179b03ebc13SStefano Zampini if (print) PetscPrintf(PETSC_COMM_SELF,"EDGE %d: ce %d, corners (%d,%d)\n",i,cedges[i],corners[2*i],corners[2*i+1]); 11804e64d54eSstefano_zampini } 11810569b399SStefano Zampini ierr = MatRestoreRowIJ(lG,0,PETSC_FALSE,PETSC_FALSE,&i,&ii,&jj,&done);CHKERRQ(ierr); 11824e64d54eSstefano_zampini ierr = PetscBTDestroy(&btvc);CHKERRQ(ierr); 11834e64d54eSstefano_zampini 1184a13144ffSStefano Zampini #if defined(PETSC_USE_DEBUG) 1185a13144ffSStefano Zampini /* Inspects columns of lG (rows of lGt) and make sure the change of basis will 1186a13144ffSStefano Zampini not interfere with neighbouring coarse edges */ 1187a13144ffSStefano Zampini ierr = PetscMalloc1(nee+1,&emarks);CHKERRQ(ierr); 1188a13144ffSStefano Zampini ierr = MatGetRowIJ(lGt,0,PETSC_FALSE,PETSC_FALSE,&i,&ii,&jj,&done);CHKERRQ(ierr); 1189a13144ffSStefano Zampini for (i=0;i<nv;i++) { 1190a13144ffSStefano Zampini PetscInt emax = 0,eemax = 0; 1191a13144ffSStefano Zampini 1192a13144ffSStefano Zampini if (ii[i+1]==ii[i] || PetscBTLookup(btv,i)) 
continue; 1193a13144ffSStefano Zampini ierr = PetscMemzero(emarks,(nee+1)*sizeof(PetscInt));CHKERRQ(ierr); 1194a13144ffSStefano Zampini for (j=ii[i];j<ii[i+1];j++) emarks[marks[jj[j]]]++; 1195a13144ffSStefano Zampini for (j=1;j<nee+1;j++) { 1196a13144ffSStefano Zampini if (emax < emarks[j]) { 1197a13144ffSStefano Zampini emax = emarks[j]; 1198a13144ffSStefano Zampini eemax = j; 1199a13144ffSStefano Zampini } 1200a13144ffSStefano Zampini } 1201a13144ffSStefano Zampini /* not relevant for edges */ 1202a13144ffSStefano Zampini if (!eemax) continue; 1203a13144ffSStefano Zampini 1204a13144ffSStefano Zampini for (j=ii[i];j<ii[i+1];j++) { 1205a13144ffSStefano Zampini if (marks[jj[j]] && marks[jj[j]] != eemax) { 1206c2151214SStefano Zampini SETERRQ4(PETSC_COMM_SELF,PETSC_ERR_SUP,"Found 2 coarse edges (id %d and %d) connected through the %d nodal dof at edge dof %d\n",marks[jj[j]]-1,eemax,i,jj[j]); 1207a13144ffSStefano Zampini } 1208a13144ffSStefano Zampini } 1209a13144ffSStefano Zampini } 1210a13144ffSStefano Zampini ierr = PetscFree(emarks);CHKERRQ(ierr); 1211a13144ffSStefano Zampini ierr = MatRestoreRowIJ(lGt,0,PETSC_FALSE,PETSC_FALSE,&i,&ii,&jj,&done);CHKERRQ(ierr); 1212a13144ffSStefano Zampini #endif 1213a13144ffSStefano Zampini 1214a13144ffSStefano Zampini /* Compute extended rows indices for edge blocks of the change of basis */ 1215a13144ffSStefano Zampini ierr = MatGetRowIJ(lGt,0,PETSC_FALSE,PETSC_FALSE,&i,&ii,&jj,&done);CHKERRQ(ierr); 1216a13144ffSStefano Zampini ierr = MatSeqAIJGetMaxRowNonzeros(lGt,&extmem);CHKERRQ(ierr); 1217a13144ffSStefano Zampini extmem *= maxsize; 1218a13144ffSStefano Zampini ierr = PetscMalloc1(extmem*nee,&extrow);CHKERRQ(ierr); 1219a13144ffSStefano Zampini ierr = PetscMalloc1(nee,&extrows);CHKERRQ(ierr); 1220a13144ffSStefano Zampini ierr = PetscCalloc1(nee,&extrowcum);CHKERRQ(ierr); 1221a13144ffSStefano Zampini for (i=0;i<nv;i++) { 1222a13144ffSStefano Zampini PetscInt mark = 0,size,start; 1223213b8bfaSStefano Zampini 1224a13144ffSStefano 
Zampini if (ii[i+1]==ii[i] || PetscBTLookup(btv,i)) continue; 1225a13144ffSStefano Zampini for (j=ii[i];j<ii[i+1];j++) 1226a13144ffSStefano Zampini if (marks[jj[j]] && !mark) 1227a13144ffSStefano Zampini mark = marks[jj[j]]; 1228a13144ffSStefano Zampini 1229a13144ffSStefano Zampini /* not relevant */ 1230a13144ffSStefano Zampini if (!mark) continue; 1231a13144ffSStefano Zampini 1232a13144ffSStefano Zampini /* import extended row */ 1233a13144ffSStefano Zampini mark--; 1234a13144ffSStefano Zampini start = mark*extmem+extrowcum[mark]; 1235a13144ffSStefano Zampini size = ii[i+1]-ii[i]; 1236a13144ffSStefano Zampini if (extrowcum[mark] + size > extmem) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Not enough memory allocated %d > %d",extrowcum[mark] + size,extmem); 1237a13144ffSStefano Zampini ierr = PetscMemcpy(extrow+start,jj+ii[i],size*sizeof(PetscInt));CHKERRQ(ierr); 1238a13144ffSStefano Zampini extrowcum[mark] += size; 1239a13144ffSStefano Zampini } 1240a13144ffSStefano Zampini ierr = MatRestoreRowIJ(lGt,0,PETSC_FALSE,PETSC_FALSE,&i,&ii,&jj,&done);CHKERRQ(ierr); 1241213b8bfaSStefano Zampini ierr = MatDestroy(&lGt);CHKERRQ(ierr); 1242213b8bfaSStefano Zampini ierr = PetscFree(marks);CHKERRQ(ierr); 1243213b8bfaSStefano Zampini 1244213b8bfaSStefano Zampini /* Compress extrows */ 1245a13144ffSStefano Zampini cum = 0; 1246a13144ffSStefano Zampini for (i=0;i<nee;i++) { 1247a13144ffSStefano Zampini PetscInt size = extrowcum[i],*start = extrow + i*extmem; 1248a13144ffSStefano Zampini ierr = PetscSortRemoveDupsInt(&size,start);CHKERRQ(ierr); 1249a13144ffSStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,size,start,PETSC_USE_POINTER,&extrows[i]);CHKERRQ(ierr); 1250a13144ffSStefano Zampini cum = PetscMax(cum,size); 1251a13144ffSStefano Zampini } 1252a13144ffSStefano Zampini ierr = PetscFree(extrowcum);CHKERRQ(ierr); 1253a13144ffSStefano Zampini ierr = PetscBTDestroy(&btv);CHKERRQ(ierr); 1254a13144ffSStefano Zampini ierr = PetscBTDestroy(&btvcand);CHKERRQ(ierr); 
1255a13144ffSStefano Zampini 1256a13144ffSStefano Zampini /* Workspace for lapack inner calls and VecSetValues */ 1257a13144ffSStefano Zampini ierr = PetscMalloc2((5+cum+maxsize)*maxsize,&work,maxsize,&rwork);CHKERRQ(ierr); 1258a13144ffSStefano Zampini 1259a13144ffSStefano Zampini /* Create change of basis matrix (preallocation can be improved) */ 1260a13144ffSStefano Zampini ierr = MatCreate(comm,&T);CHKERRQ(ierr); 1261c2151214SStefano Zampini ierr = MatSetSizes(T,pc->pmat->rmap->n,pc->pmat->rmap->n, 1262c2151214SStefano Zampini pc->pmat->rmap->N,pc->pmat->rmap->N);CHKERRQ(ierr); 1263a13144ffSStefano Zampini ierr = MatSetType(T,MATAIJ);CHKERRQ(ierr); 1264a13144ffSStefano Zampini ierr = MatSeqAIJSetPreallocation(T,10,NULL);CHKERRQ(ierr); 1265a13144ffSStefano Zampini ierr = MatMPIAIJSetPreallocation(T,10,NULL,10,NULL);CHKERRQ(ierr); 12661e0482f5SStefano Zampini ierr = MatSetLocalToGlobalMapping(T,al2g,al2g);CHKERRQ(ierr); 1267a13144ffSStefano Zampini ierr = MatSetOption(T,MAT_NEW_NONZERO_ALLOCATION_ERR,PETSC_FALSE);CHKERRQ(ierr); 1268a13144ffSStefano Zampini ierr = MatSetOption(T,MAT_ROW_ORIENTED,PETSC_FALSE);CHKERRQ(ierr); 1269213b8bfaSStefano Zampini ierr = ISLocalToGlobalMappingDestroy(&al2g);CHKERRQ(ierr); 1270a13144ffSStefano Zampini 1271a13144ffSStefano Zampini /* Defaults to identity */ 1272c2151214SStefano Zampini ierr = MatCreateVecs(pc->pmat,&tvec,NULL);CHKERRQ(ierr); 1273a13144ffSStefano Zampini ierr = VecSet(tvec,1.0);CHKERRQ(ierr); 1274a13144ffSStefano Zampini ierr = MatDiagonalSet(T,tvec,INSERT_VALUES);CHKERRQ(ierr); 1275a13144ffSStefano Zampini ierr = VecDestroy(&tvec);CHKERRQ(ierr); 1276a13144ffSStefano Zampini 12771e0482f5SStefano Zampini /* Create discrete gradient for the coarser level if needed */ 12781e0482f5SStefano Zampini ierr = MatDestroy(&pcbddc->nedcG);CHKERRQ(ierr); 12791e0482f5SStefano Zampini ierr = ISDestroy(&pcbddc->nedclocal);CHKERRQ(ierr); 12801e0482f5SStefano Zampini if (pcbddc->current_level < pcbddc->max_levels) { 
12811e0482f5SStefano Zampini ISLocalToGlobalMapping cel2g,cvl2g; 12821e0482f5SStefano Zampini IS wis,gwis; 12831e0482f5SStefano Zampini PetscInt cnv,cne; 12841e0482f5SStefano Zampini 12851e0482f5SStefano Zampini ierr = ISCreateGeneral(comm,nee,cedges,PETSC_COPY_VALUES,&wis);CHKERRQ(ierr); 12861e0482f5SStefano Zampini if (fl2g) { 12871e0482f5SStefano Zampini ierr = ISLocalToGlobalMappingApplyIS(fl2g,wis,&pcbddc->nedclocal);CHKERRQ(ierr); 12881e0482f5SStefano Zampini } else { 12891e0482f5SStefano Zampini ierr = PetscObjectReference((PetscObject)wis);CHKERRQ(ierr); 12901e0482f5SStefano Zampini pcbddc->nedclocal = wis; 12911e0482f5SStefano Zampini } 12921e0482f5SStefano Zampini ierr = ISLocalToGlobalMappingApplyIS(el2g,wis,&gwis);CHKERRQ(ierr); 12931e0482f5SStefano Zampini ierr = ISDestroy(&wis);CHKERRQ(ierr); 12941e0482f5SStefano Zampini ierr = ISRenumber(gwis,NULL,&cne,&wis);CHKERRQ(ierr); 12951e0482f5SStefano Zampini ierr = ISLocalToGlobalMappingCreateIS(wis,&cel2g);CHKERRQ(ierr); 12961e0482f5SStefano Zampini ierr = ISDestroy(&wis);CHKERRQ(ierr); 12971e0482f5SStefano Zampini ierr = ISDestroy(&gwis);CHKERRQ(ierr); 12981e0482f5SStefano Zampini 12991e0482f5SStefano Zampini ierr = ISCreateGeneral(comm,2*nee,corners,PETSC_USE_POINTER,&wis);CHKERRQ(ierr); 13001e0482f5SStefano Zampini ierr = ISLocalToGlobalMappingApplyIS(vl2g,wis,&gwis);CHKERRQ(ierr); 13011e0482f5SStefano Zampini ierr = ISDestroy(&wis);CHKERRQ(ierr); 13021e0482f5SStefano Zampini ierr = ISRenumber(gwis,NULL,&cnv,&wis);CHKERRQ(ierr); 13031e0482f5SStefano Zampini ierr = ISLocalToGlobalMappingCreateIS(wis,&cvl2g);CHKERRQ(ierr); 13041e0482f5SStefano Zampini ierr = ISDestroy(&wis);CHKERRQ(ierr); 13051e0482f5SStefano Zampini ierr = ISDestroy(&gwis);CHKERRQ(ierr); 13061e0482f5SStefano Zampini 13071e0482f5SStefano Zampini ierr = MatCreate(comm,&pcbddc->nedcG);CHKERRQ(ierr); 13081e0482f5SStefano Zampini ierr = MatSetSizes(pcbddc->nedcG,PETSC_DECIDE,PETSC_DECIDE,cne,cnv);CHKERRQ(ierr); 13091e0482f5SStefano Zampini 
ierr = MatSetType(pcbddc->nedcG,MATAIJ);CHKERRQ(ierr); 13101e0482f5SStefano Zampini ierr = MatSeqAIJSetPreallocation(pcbddc->nedcG,2,NULL);CHKERRQ(ierr); 13111e0482f5SStefano Zampini ierr = MatMPIAIJSetPreallocation(pcbddc->nedcG,2,NULL,2,NULL);CHKERRQ(ierr); 13121e0482f5SStefano Zampini ierr = MatSetLocalToGlobalMapping(pcbddc->nedcG,cel2g,cvl2g);CHKERRQ(ierr); 13131e0482f5SStefano Zampini ierr = ISLocalToGlobalMappingDestroy(&cel2g);CHKERRQ(ierr); 13141e0482f5SStefano Zampini ierr = ISLocalToGlobalMappingDestroy(&cvl2g);CHKERRQ(ierr); 13151e0482f5SStefano Zampini } 1316213b8bfaSStefano Zampini ierr = ISLocalToGlobalMappingDestroy(&vl2g);CHKERRQ(ierr); 13171e0482f5SStefano Zampini 13181e0482f5SStefano Zampini #if defined(PRINT_GDET) 13191e0482f5SStefano Zampini inc = 0; 13201e0482f5SStefano Zampini lev = pcbddc->current_level; 13211e0482f5SStefano Zampini #endif 1322213b8bfaSStefano Zampini 1323213b8bfaSStefano Zampini /* Insert values in the change of basis matrix */ 1324a13144ffSStefano Zampini for (i=0;i<nee;i++) { 1325a13144ffSStefano Zampini Mat Gins = NULL, GKins = NULL; 13261e0482f5SStefano Zampini IS cornersis = NULL; 13271e0482f5SStefano Zampini PetscScalar cvals[2]; 1328a13144ffSStefano Zampini 13291e0482f5SStefano Zampini if (pcbddc->nedcG) { 13301e0482f5SStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,2,corners+2*i,PETSC_USE_POINTER,&cornersis);CHKERRQ(ierr); 13311e0482f5SStefano Zampini } 13321e0482f5SStefano Zampini ierr = PCBDDCComputeNedelecChangeEdge(lG,eedges[i],extrows[i],extcols[i],cornersis,&Gins,&GKins,cvals,work,rwork);CHKERRQ(ierr); 1333a13144ffSStefano Zampini if (Gins && GKins) { 1334a13144ffSStefano Zampini PetscScalar *data; 1335a13144ffSStefano Zampini const PetscInt *rows,*cols; 1336a13144ffSStefano Zampini PetscInt nrh,nch,nrc,ncc; 1337a13144ffSStefano Zampini 1338a13144ffSStefano Zampini ierr = ISGetIndices(eedges[i],&cols);CHKERRQ(ierr); 1339a13144ffSStefano Zampini /* H1 */ 1340a13144ffSStefano Zampini ierr = 
ISGetIndices(extrows[i],&rows);CHKERRQ(ierr); 1341a13144ffSStefano Zampini ierr = MatGetSize(Gins,&nrh,&nch);CHKERRQ(ierr); 1342a13144ffSStefano Zampini ierr = MatDenseGetArray(Gins,&data);CHKERRQ(ierr); 1343a13144ffSStefano Zampini ierr = MatSetValuesLocal(T,nrh,rows,nch,cols,data,INSERT_VALUES);CHKERRQ(ierr); 1344a13144ffSStefano Zampini ierr = MatDenseRestoreArray(Gins,&data);CHKERRQ(ierr); 1345a13144ffSStefano Zampini ierr = ISRestoreIndices(extrows[i],&rows);CHKERRQ(ierr); 1346a13144ffSStefano Zampini /* complement */ 1347a13144ffSStefano Zampini ierr = MatGetSize(GKins,&nrc,&ncc);CHKERRQ(ierr); 13481e0482f5SStefano Zampini if (!ncc) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Constant function has not been generated for coarse edge %d",i); 1349213b8bfaSStefano Zampini if (ncc + nch != nrc) SETERRQ4(PETSC_COMM_SELF,PETSC_ERR_PLIB,"The sum of the number of columns of GKins %d and Gins %d does not match %d for coarse edge %d",ncc,nch,nrc,i); 1350213b8bfaSStefano Zampini if (ncc != 1 && pcbddc->nedcG) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_SUP,"Cannot generate the coarse discrete gradient for coarse edge %d with ncc %d",i,ncc); 1351a13144ffSStefano Zampini ierr = MatDenseGetArray(GKins,&data);CHKERRQ(ierr); 1352a13144ffSStefano Zampini ierr = MatSetValuesLocal(T,nrc,cols,ncc,cols+nch,data,INSERT_VALUES);CHKERRQ(ierr); 1353a13144ffSStefano Zampini ierr = MatDenseRestoreArray(GKins,&data);CHKERRQ(ierr); 13541e0482f5SStefano Zampini 13551e0482f5SStefano Zampini /* coarse discrete gradient */ 13561e0482f5SStefano Zampini if (pcbddc->nedcG) { 13571e0482f5SStefano Zampini PetscInt cols[2]; 13581e0482f5SStefano Zampini 13591e0482f5SStefano Zampini cols[0] = 2*i; 13601e0482f5SStefano Zampini cols[1] = 2*i+1; 13611e0482f5SStefano Zampini ierr = MatSetValuesLocal(pcbddc->nedcG,1,&i,2,cols,cvals,INSERT_VALUES);CHKERRQ(ierr); 13621e0482f5SStefano Zampini } 1363a13144ffSStefano Zampini ierr = ISRestoreIndices(eedges[i],&cols);CHKERRQ(ierr); 1364a13144ffSStefano Zampini } 
1365a13144ffSStefano Zampini ierr = ISDestroy(&extrows[i]);CHKERRQ(ierr); 1366a13144ffSStefano Zampini ierr = ISDestroy(&extcols[i]);CHKERRQ(ierr); 13671e0482f5SStefano Zampini ierr = ISDestroy(&cornersis);CHKERRQ(ierr); 1368a13144ffSStefano Zampini ierr = MatDestroy(&Gins);CHKERRQ(ierr); 1369a13144ffSStefano Zampini ierr = MatDestroy(&GKins);CHKERRQ(ierr); 1370a13144ffSStefano Zampini } 1371213b8bfaSStefano Zampini ierr = ISLocalToGlobalMappingDestroy(&el2g);CHKERRQ(ierr); 1372a13144ffSStefano Zampini 1373a13144ffSStefano Zampini /* Start assembling */ 1374a13144ffSStefano Zampini ierr = MatAssemblyBegin(T,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 13751e0482f5SStefano Zampini if (pcbddc->nedcG) { 13761e0482f5SStefano Zampini ierr = MatAssemblyBegin(pcbddc->nedcG,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 13771e0482f5SStefano Zampini } 1378a13144ffSStefano Zampini 1379a13144ffSStefano Zampini /* Free */ 1380c2151214SStefano Zampini if (fl2g) { 1381c2151214SStefano Zampini ierr = ISDestroy(&primals);CHKERRQ(ierr); 1382c2151214SStefano Zampini for (i=0;i<nee;i++) { 1383c2151214SStefano Zampini ierr = ISDestroy(&eedges[i]);CHKERRQ(ierr); 1384c2151214SStefano Zampini } 1385c2151214SStefano Zampini ierr = PetscFree(eedges);CHKERRQ(ierr); 1386c2151214SStefano Zampini } 1387eee23b56SStefano Zampini 1388eee23b56SStefano Zampini /* hack mat_graph with primal dofs on the coarse edges */ 1389eee23b56SStefano Zampini { 1390eee23b56SStefano Zampini PCBDDCGraph graph = pcbddc->mat_graph; 1391eee23b56SStefano Zampini PetscInt *oqueue = graph->queue; 1392eee23b56SStefano Zampini PetscInt *ocptr = graph->cptr; 1393eee23b56SStefano Zampini PetscInt ncc,*idxs; 1394eee23b56SStefano Zampini 1395eee23b56SStefano Zampini /* find first primal edge */ 1396eee23b56SStefano Zampini if (pcbddc->nedclocal) { 1397eee23b56SStefano Zampini ierr = ISGetIndices(pcbddc->nedclocal,(const PetscInt**)&idxs);CHKERRQ(ierr); 1398eee23b56SStefano Zampini } else { 1399eee23b56SStefano Zampini if (fl2g) { 
1400eee23b56SStefano Zampini ierr = ISLocalToGlobalMappingApply(fl2g,nee,cedges,cedges);CHKERRQ(ierr); 1401eee23b56SStefano Zampini } 1402eee23b56SStefano Zampini idxs = cedges; 1403eee23b56SStefano Zampini } 1404eee23b56SStefano Zampini cum = 0; 1405eee23b56SStefano Zampini while (cum < nee && cedges[cum] < 0) cum++; 1406eee23b56SStefano Zampini 1407eee23b56SStefano Zampini /* adapt connected components */ 1408eee23b56SStefano Zampini ierr = PetscMalloc2(graph->nvtxs+1,&graph->cptr,ocptr[graph->ncc],&graph->queue);CHKERRQ(ierr); 1409eee23b56SStefano Zampini graph->cptr[0] = 0; 1410eee23b56SStefano Zampini for (i=0,ncc=0;i<graph->ncc;i++) { 1411eee23b56SStefano Zampini PetscInt lc = ocptr[i+1]-ocptr[i]; 1412eee23b56SStefano Zampini if (cum != nee && oqueue[ocptr[i+1]-1] == cedges[cum]) { /* this cc has a primal dof */ 1413eee23b56SStefano Zampini graph->cptr[ncc+1] = graph->cptr[ncc]+1; 1414eee23b56SStefano Zampini graph->queue[graph->cptr[ncc]] = cedges[cum]; 1415eee23b56SStefano Zampini ncc++; 1416eee23b56SStefano Zampini lc--; 1417eee23b56SStefano Zampini cum++; 1418eee23b56SStefano Zampini while (cum < nee && cedges[cum] < 0) cum++; 1419eee23b56SStefano Zampini } 1420eee23b56SStefano Zampini graph->cptr[ncc+1] = graph->cptr[ncc] + lc; 1421eee23b56SStefano Zampini for (j=0;j<lc;j++) graph->queue[graph->cptr[ncc]+j] = oqueue[ocptr[i]+j]; 1422eee23b56SStefano Zampini ncc++; 1423eee23b56SStefano Zampini } 1424eee23b56SStefano Zampini graph->ncc = ncc; 1425eee23b56SStefano Zampini if (pcbddc->nedclocal) { 1426eee23b56SStefano Zampini ierr = ISRestoreIndices(pcbddc->nedclocal,(const PetscInt**)&idxs);CHKERRQ(ierr); 1427eee23b56SStefano Zampini } 1428eee23b56SStefano Zampini ierr = PetscFree2(ocptr,oqueue);CHKERRQ(ierr); 1429eee23b56SStefano Zampini } 1430213b8bfaSStefano Zampini ierr = ISLocalToGlobalMappingDestroy(&fl2g);CHKERRQ(ierr); 1431c2151214SStefano Zampini ierr = 
PCBDDCGraphRestoreCandidatesIS(pcbddc->mat_graph,NULL,NULL,&nee,&alleedges,&allprimals);CHKERRQ(ierr); 1432c2151214SStefano Zampini ierr = PCBDDCGraphResetCSR(pcbddc->mat_graph);CHKERRQ(ierr); 1433213b8bfaSStefano Zampini ierr = MatDestroy(&conn);CHKERRQ(ierr); 1434eee23b56SStefano Zampini 1435c2151214SStefano Zampini ierr = ISDestroy(&nedfieldlocal);CHKERRQ(ierr); 1436a13144ffSStefano Zampini ierr = PetscFree(extrow);CHKERRQ(ierr); 1437a13144ffSStefano Zampini ierr = PetscFree2(work,rwork);CHKERRQ(ierr); 1438b03ebc13SStefano Zampini ierr = PetscFree(corners);CHKERRQ(ierr); 1439b03ebc13SStefano Zampini ierr = PetscFree(cedges);CHKERRQ(ierr); 1440a13144ffSStefano Zampini ierr = PetscFree(extrows);CHKERRQ(ierr); 1441a13144ffSStefano Zampini ierr = PetscFree(extcols);CHKERRQ(ierr); 1442a13144ffSStefano Zampini ierr = MatDestroy(&lG);CHKERRQ(ierr); 1443a13144ffSStefano Zampini 1444a13144ffSStefano Zampini /* Complete assembling */ 1445a13144ffSStefano Zampini ierr = MatAssemblyEnd(T,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 14461e0482f5SStefano Zampini if (pcbddc->nedcG) { 14471e0482f5SStefano Zampini ierr = MatAssemblyEnd(pcbddc->nedcG,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 14481e0482f5SStefano Zampini #if 0 14491e0482f5SStefano Zampini ierr = PetscObjectSetName((PetscObject)pcbddc->nedcG,"coarse_G");CHKERRQ(ierr); 14501e0482f5SStefano Zampini ierr = MatView(pcbddc->nedcG,NULL);CHKERRQ(ierr); 14511e0482f5SStefano Zampini #endif 14521e0482f5SStefano Zampini } 1453a13144ffSStefano Zampini 1454a13144ffSStefano Zampini /* set change of basis */ 1455213b8bfaSStefano Zampini ierr = PCBDDCSetChangeOfBasisMat(pc,T,singular);CHKERRQ(ierr); 1456a13144ffSStefano Zampini ierr = MatDestroy(&T);CHKERRQ(ierr); 1457a13144ffSStefano Zampini 1458a13144ffSStefano Zampini PetscFunctionReturn(0); 1459a13144ffSStefano Zampini } 1460a13144ffSStefano Zampini 1461d8203eabSStefano Zampini /* the near-null space of BDDC carries information on quadrature weights, 1462d8203eabSStefano Zampini and these can 
be collinear -> so cheat with MatNullSpaceCreate 1463d8203eabSStefano Zampini and create a suitable set of basis vectors first */ 1464d8203eabSStefano Zampini PetscErrorCode PCBDDCNullSpaceCreate(MPI_Comm comm, PetscBool has_const, PetscInt nvecs, Vec quad_vecs[], MatNullSpace *nnsp) 1465d8203eabSStefano Zampini { 1466d8203eabSStefano Zampini PetscErrorCode ierr; 1467d8203eabSStefano Zampini PetscInt i; 1468d8203eabSStefano Zampini 1469d8203eabSStefano Zampini PetscFunctionBegin; 1470d8203eabSStefano Zampini for (i=0;i<nvecs;i++) { 1471d8203eabSStefano Zampini PetscInt first,last; 1472d8203eabSStefano Zampini 1473d8203eabSStefano Zampini ierr = VecGetOwnershipRange(quad_vecs[i],&first,&last);CHKERRQ(ierr); 147486fa73c5SStefano Zampini if (last-first < 2*nvecs && has_const) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"Not implemented"); 1475d8203eabSStefano Zampini if (i>=first && i < last) { 1476d8203eabSStefano Zampini PetscScalar *data; 1477d8203eabSStefano Zampini ierr = VecGetArray(quad_vecs[i],&data);CHKERRQ(ierr); 1478d8203eabSStefano Zampini if (!has_const) { 1479d8203eabSStefano Zampini data[i-first] = 1.; 1480d8203eabSStefano Zampini } else { 148186fa73c5SStefano Zampini data[2*i-first] = 1./PetscSqrtReal(2.); 148286fa73c5SStefano Zampini data[2*i-first+1] = -1./PetscSqrtReal(2.); 1483d8203eabSStefano Zampini } 1484d8203eabSStefano Zampini ierr = VecRestoreArray(quad_vecs[i],&data);CHKERRQ(ierr); 1485d8203eabSStefano Zampini } 1486d8203eabSStefano Zampini ierr = PetscObjectStateIncrease((PetscObject)quad_vecs[i]);CHKERRQ(ierr); 1487d8203eabSStefano Zampini } 1488d8203eabSStefano Zampini ierr = MatNullSpaceCreate(comm,has_const,nvecs,quad_vecs,nnsp);CHKERRQ(ierr); 1489d8203eabSStefano Zampini for (i=0;i<nvecs;i++) { /* reset vectors */ 1490d8203eabSStefano Zampini PetscInt first,last; 1491ddc40e2cSstefano_zampini ierr = VecLockPop(quad_vecs[i]);CHKERRQ(ierr); 1492d8203eabSStefano Zampini ierr = VecGetOwnershipRange(quad_vecs[i],&first,&last);CHKERRQ(ierr); 
1493d8203eabSStefano Zampini if (i>=first && i < last) { 1494d8203eabSStefano Zampini PetscScalar *data; 1495d8203eabSStefano Zampini ierr = VecGetArray(quad_vecs[i],&data);CHKERRQ(ierr); 1496d8203eabSStefano Zampini if (!has_const) { 1497d8203eabSStefano Zampini data[i-first] = 0.; 1498d8203eabSStefano Zampini } else { 149986fa73c5SStefano Zampini data[2*i-first] = 0.; 150086fa73c5SStefano Zampini data[2*i-first+1] = 0.; 1501d8203eabSStefano Zampini } 1502d8203eabSStefano Zampini ierr = VecRestoreArray(quad_vecs[i],&data);CHKERRQ(ierr); 1503d8203eabSStefano Zampini } 1504d8203eabSStefano Zampini ierr = PetscObjectStateIncrease((PetscObject)quad_vecs[i]);CHKERRQ(ierr); 1505ddc40e2cSstefano_zampini ierr = VecLockPush(quad_vecs[i]);CHKERRQ(ierr); 1506d8203eabSStefano Zampini } 1507d8203eabSStefano Zampini PetscFunctionReturn(0); 1508d8203eabSStefano Zampini } 1509d8203eabSStefano Zampini 15108ae0ca82SStefano Zampini PetscErrorCode PCBDDCComputeNoNetFlux(Mat A, Mat divudotp, PetscBool transpose, IS vl2l, PCBDDCGraph graph, MatNullSpace *nnsp) 1511669cc0f4SStefano Zampini { 1512a198735bSStefano Zampini Mat loc_divudotp; 1513fa23a32eSStefano Zampini Vec p,v,vins,quad_vec,*quad_vecs; 15148ae0ca82SStefano Zampini ISLocalToGlobalMapping map; 1515669cc0f4SStefano Zampini IS *faces,*edges; 1516669cc0f4SStefano Zampini PetscScalar *vals; 1517669cc0f4SStefano Zampini const PetscScalar *array; 1518669cc0f4SStefano Zampini PetscInt i,maxneighs,lmaxneighs,maxsize,nf,ne; 15191ae86dd6SStefano Zampini PetscMPIInt rank; 1520a198735bSStefano Zampini PetscErrorCode ierr; 1521669cc0f4SStefano Zampini 1522669cc0f4SStefano Zampini PetscFunctionBegin; 1523669cc0f4SStefano Zampini ierr = PCBDDCGraphGetCandidatesIS(graph,&nf,&faces,&ne,&edges,NULL);CHKERRQ(ierr); 1524669cc0f4SStefano Zampini if (graph->twodim) { 1525669cc0f4SStefano Zampini lmaxneighs = 2; 1526669cc0f4SStefano Zampini } else { 1527669cc0f4SStefano Zampini lmaxneighs = 1; 1528669cc0f4SStefano Zampini for (i=0;i<ne;i++) { 
1529669cc0f4SStefano Zampini const PetscInt *idxs; 1530669cc0f4SStefano Zampini ierr = ISGetIndices(edges[i],&idxs);CHKERRQ(ierr); 1531669cc0f4SStefano Zampini lmaxneighs = PetscMax(lmaxneighs,graph->count[idxs[0]]); 1532669cc0f4SStefano Zampini ierr = ISRestoreIndices(edges[i],&idxs);CHKERRQ(ierr); 1533669cc0f4SStefano Zampini } 1534669cc0f4SStefano Zampini lmaxneighs++; /* graph count does not include self */ 1535669cc0f4SStefano Zampini } 1536669cc0f4SStefano Zampini ierr = MPIU_Allreduce(&lmaxneighs,&maxneighs,1,MPIU_INT,MPI_MAX,PetscObjectComm((PetscObject)A));CHKERRQ(ierr); 1537669cc0f4SStefano Zampini maxsize = 0; 1538669cc0f4SStefano Zampini for (i=0;i<ne;i++) { 1539669cc0f4SStefano Zampini PetscInt nn; 1540669cc0f4SStefano Zampini ierr = ISGetLocalSize(edges[i],&nn);CHKERRQ(ierr); 1541669cc0f4SStefano Zampini maxsize = PetscMax(maxsize,nn); 1542669cc0f4SStefano Zampini } 1543669cc0f4SStefano Zampini for (i=0;i<nf;i++) { 1544669cc0f4SStefano Zampini PetscInt nn; 1545669cc0f4SStefano Zampini ierr = ISGetLocalSize(faces[i],&nn);CHKERRQ(ierr); 1546669cc0f4SStefano Zampini maxsize = PetscMax(maxsize,nn); 1547669cc0f4SStefano Zampini } 1548669cc0f4SStefano Zampini ierr = PetscMalloc1(maxsize,&vals);CHKERRQ(ierr); 1549669cc0f4SStefano Zampini /* create vectors to hold quadrature weights */ 1550669cc0f4SStefano Zampini ierr = MatCreateVecs(A,&quad_vec,NULL);CHKERRQ(ierr); 15518ae0ca82SStefano Zampini if (!transpose) { 15528ae0ca82SStefano Zampini ierr = MatGetLocalToGlobalMapping(A,&map,NULL);CHKERRQ(ierr); 15538ae0ca82SStefano Zampini } else { 15548ae0ca82SStefano Zampini ierr = MatGetLocalToGlobalMapping(A,NULL,&map);CHKERRQ(ierr); 15558ae0ca82SStefano Zampini } 1556669cc0f4SStefano Zampini ierr = VecDuplicateVecs(quad_vec,maxneighs,&quad_vecs);CHKERRQ(ierr); 15571ae86dd6SStefano Zampini ierr = VecDestroy(&quad_vec);CHKERRQ(ierr); 1558d8203eabSStefano Zampini ierr = 
PCBDDCNullSpaceCreate(PetscObjectComm((PetscObject)A),PETSC_FALSE,maxneighs,quad_vecs,nnsp);CHKERRQ(ierr); 1559669cc0f4SStefano Zampini for (i=0;i<maxneighs;i++) { 1560ddc40e2cSstefano_zampini ierr = VecLockPop(quad_vecs[i]);CHKERRQ(ierr); 15618ae0ca82SStefano Zampini ierr = VecSetLocalToGlobalMapping(quad_vecs[i],map);CHKERRQ(ierr); 1562669cc0f4SStefano Zampini } 1563d8203eabSStefano Zampini 1564669cc0f4SStefano Zampini /* compute local quad vec */ 1565a198735bSStefano Zampini ierr = MatISGetLocalMat(divudotp,&loc_divudotp);CHKERRQ(ierr); 15668ae0ca82SStefano Zampini if (!transpose) { 1567a198735bSStefano Zampini ierr = MatCreateVecs(loc_divudotp,&v,&p);CHKERRQ(ierr); 15688ae0ca82SStefano Zampini } else { 15698ae0ca82SStefano Zampini ierr = MatCreateVecs(loc_divudotp,&p,&v);CHKERRQ(ierr); 15708ae0ca82SStefano Zampini } 1571669cc0f4SStefano Zampini ierr = VecSet(p,1.);CHKERRQ(ierr); 15728ae0ca82SStefano Zampini if (!transpose) { 1573a198735bSStefano Zampini ierr = MatMultTranspose(loc_divudotp,p,v);CHKERRQ(ierr); 15748ae0ca82SStefano Zampini } else { 15758ae0ca82SStefano Zampini ierr = MatMult(loc_divudotp,p,v);CHKERRQ(ierr); 15768ae0ca82SStefano Zampini } 1577fa23a32eSStefano Zampini if (vl2l) { 1578187c917aSStefano Zampini Mat lA; 1579187c917aSStefano Zampini VecScatter sc; 1580187c917aSStefano Zampini 1581187c917aSStefano Zampini ierr = MatISGetLocalMat(A,&lA);CHKERRQ(ierr); 1582187c917aSStefano Zampini ierr = MatCreateVecs(lA,&vins,NULL);CHKERRQ(ierr); 1583187c917aSStefano Zampini ierr = VecScatterCreate(v,vl2l,vins,NULL,&sc);CHKERRQ(ierr); 1584187c917aSStefano Zampini ierr = VecScatterBegin(sc,v,vins,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 1585187c917aSStefano Zampini ierr = VecScatterEnd(sc,v,vins,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 1586187c917aSStefano Zampini ierr = VecScatterDestroy(&sc);CHKERRQ(ierr); 1587fa23a32eSStefano Zampini } else { 1588fa23a32eSStefano Zampini vins = v; 1589fa23a32eSStefano Zampini } 1590fa23a32eSStefano Zampini 
ierr = VecGetArrayRead(vins,&array);CHKERRQ(ierr); 1591669cc0f4SStefano Zampini ierr = VecDestroy(&p);CHKERRQ(ierr); 15929a962809SStefano Zampini 15931ae86dd6SStefano Zampini /* insert in global quadrature vecs */ 15941ae86dd6SStefano Zampini ierr = MPI_Comm_rank(PetscObjectComm((PetscObject)A),&rank);CHKERRQ(ierr); 1595669cc0f4SStefano Zampini for (i=0;i<nf;i++) { 1596669cc0f4SStefano Zampini const PetscInt *idxs; 1597669cc0f4SStefano Zampini PetscInt idx,nn,j; 1598669cc0f4SStefano Zampini 1599669cc0f4SStefano Zampini ierr = ISGetIndices(faces[i],&idxs);CHKERRQ(ierr); 1600669cc0f4SStefano Zampini ierr = ISGetLocalSize(faces[i],&nn);CHKERRQ(ierr); 1601669cc0f4SStefano Zampini for (j=0;j<nn;j++) vals[j] = array[idxs[j]]; 16021ae86dd6SStefano Zampini ierr = PetscFindInt(rank,graph->count[idxs[0]],graph->neighbours_set[idxs[0]],&idx);CHKERRQ(ierr); 1603669cc0f4SStefano Zampini idx = -(idx+1); 1604669cc0f4SStefano Zampini ierr = VecSetValuesLocal(quad_vecs[idx],nn,idxs,vals,INSERT_VALUES);CHKERRQ(ierr); 1605669cc0f4SStefano Zampini ierr = ISRestoreIndices(faces[i],&idxs);CHKERRQ(ierr); 1606669cc0f4SStefano Zampini } 1607669cc0f4SStefano Zampini for (i=0;i<ne;i++) { 1608669cc0f4SStefano Zampini const PetscInt *idxs; 1609669cc0f4SStefano Zampini PetscInt idx,nn,j; 1610669cc0f4SStefano Zampini 1611669cc0f4SStefano Zampini ierr = ISGetIndices(edges[i],&idxs);CHKERRQ(ierr); 1612669cc0f4SStefano Zampini ierr = ISGetLocalSize(edges[i],&nn);CHKERRQ(ierr); 1613669cc0f4SStefano Zampini for (j=0;j<nn;j++) vals[j] = array[idxs[j]]; 16141ae86dd6SStefano Zampini ierr = PetscFindInt(rank,graph->count[idxs[0]],graph->neighbours_set[idxs[0]],&idx);CHKERRQ(ierr); 1615669cc0f4SStefano Zampini idx = -(idx+1); 1616669cc0f4SStefano Zampini ierr = VecSetValuesLocal(quad_vecs[idx],nn,idxs,vals,INSERT_VALUES);CHKERRQ(ierr); 1617669cc0f4SStefano Zampini ierr = ISRestoreIndices(edges[i],&idxs);CHKERRQ(ierr); 1618669cc0f4SStefano Zampini } 1619c8272957SStefano Zampini ierr = 
PCBDDCGraphRestoreCandidatesIS(graph,&nf,&faces,&ne,&edges,NULL);CHKERRQ(ierr); 1620fa23a32eSStefano Zampini ierr = VecRestoreArrayRead(vins,&array);CHKERRQ(ierr); 1621fa23a32eSStefano Zampini if (vl2l) { 1622187c917aSStefano Zampini ierr = VecDestroy(&vins);CHKERRQ(ierr); 1623fa23a32eSStefano Zampini } 1624669cc0f4SStefano Zampini ierr = VecDestroy(&v);CHKERRQ(ierr); 1625669cc0f4SStefano Zampini ierr = PetscFree(vals);CHKERRQ(ierr); 1626669cc0f4SStefano Zampini 1627669cc0f4SStefano Zampini /* assemble near null space */ 1628669cc0f4SStefano Zampini for (i=0;i<maxneighs;i++) { 1629669cc0f4SStefano Zampini ierr = VecAssemblyBegin(quad_vecs[i]);CHKERRQ(ierr); 1630669cc0f4SStefano Zampini } 1631669cc0f4SStefano Zampini for (i=0;i<maxneighs;i++) { 1632669cc0f4SStefano Zampini ierr = VecAssemblyEnd(quad_vecs[i]);CHKERRQ(ierr); 1633ddc40e2cSstefano_zampini ierr = VecLockPush(quad_vecs[i]);CHKERRQ(ierr); 1634669cc0f4SStefano Zampini } 1635669cc0f4SStefano Zampini ierr = VecDestroyVecs(maxneighs,&quad_vecs);CHKERRQ(ierr); 1636669cc0f4SStefano Zampini PetscFunctionReturn(0); 1637669cc0f4SStefano Zampini } 1638669cc0f4SStefano Zampini 1639669cc0f4SStefano Zampini 16401f4df5f7SStefano Zampini PetscErrorCode PCBDDCComputeLocalTopologyInfo(PC pc) 16411f4df5f7SStefano Zampini { 16421f4df5f7SStefano Zampini PetscErrorCode ierr; 16431f4df5f7SStefano Zampini Vec local,global; 16441f4df5f7SStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 16451f4df5f7SStefano Zampini Mat_IS *matis = (Mat_IS*)pc->pmat->data; 16465c5e10d6SStefano Zampini PetscBool monolithic = PETSC_FALSE; 16471f4df5f7SStefano Zampini 16481f4df5f7SStefano Zampini PetscFunctionBegin; 16495c5e10d6SStefano Zampini ierr = PetscOptionsBegin(PetscObjectComm((PetscObject)pc),((PetscObject)pc)->prefix,"BDDC topology options","PC");CHKERRQ(ierr); 16505c5e10d6SStefano Zampini ierr = PetscOptionsBool("-pc_bddc_monolithic","Discard any information on dofs splitting",NULL,monolithic,&monolithic,NULL);CHKERRQ(ierr); 
16515c5e10d6SStefano Zampini ierr = PetscOptionsEnd();CHKERRQ(ierr); 16521f4df5f7SStefano Zampini /* need to convert from global to local topology information and remove references to information in global ordering */ 165321ef3d20SStefano Zampini ierr = MatCreateVecs(pc->pmat,&global,NULL);CHKERRQ(ierr); 16541f4df5f7SStefano Zampini ierr = MatCreateVecs(matis->A,&local,NULL);CHKERRQ(ierr); 16555c5e10d6SStefano Zampini if (monolithic) goto boundary; 16565c5e10d6SStefano Zampini 16571f4df5f7SStefano Zampini if (pcbddc->user_provided_isfordofs) { 16581f4df5f7SStefano Zampini if (pcbddc->n_ISForDofs) { 16591f4df5f7SStefano Zampini PetscInt i; 16601f4df5f7SStefano Zampini ierr = PetscMalloc1(pcbddc->n_ISForDofs,&pcbddc->ISForDofsLocal);CHKERRQ(ierr); 16611f4df5f7SStefano Zampini for (i=0;i<pcbddc->n_ISForDofs;i++) { 16621f4df5f7SStefano Zampini ierr = PCBDDCGlobalToLocal(matis->rctx,global,local,pcbddc->ISForDofs[i],&pcbddc->ISForDofsLocal[i]);CHKERRQ(ierr); 16631f4df5f7SStefano Zampini ierr = ISDestroy(&pcbddc->ISForDofs[i]);CHKERRQ(ierr); 16641f4df5f7SStefano Zampini } 16651f4df5f7SStefano Zampini pcbddc->n_ISForDofsLocal = pcbddc->n_ISForDofs; 16661f4df5f7SStefano Zampini pcbddc->n_ISForDofs = 0; 16671f4df5f7SStefano Zampini ierr = PetscFree(pcbddc->ISForDofs);CHKERRQ(ierr); 16681f4df5f7SStefano Zampini } 16691f4df5f7SStefano Zampini } else { 167021ef3d20SStefano Zampini if (!pcbddc->n_ISForDofsLocal) { /* field split not present */ 167121ef3d20SStefano Zampini DM dm; 167221ef3d20SStefano Zampini 167321ef3d20SStefano Zampini ierr = PCGetDM(pc, &dm);CHKERRQ(ierr); 167421ef3d20SStefano Zampini if (!dm) { 167521ef3d20SStefano Zampini ierr = MatGetDM(pc->pmat, &dm);CHKERRQ(ierr); 167621ef3d20SStefano Zampini } 167721ef3d20SStefano Zampini if (dm) { 167821ef3d20SStefano Zampini IS *fields; 167921ef3d20SStefano Zampini PetscInt nf,i; 168021ef3d20SStefano Zampini ierr = DMCreateFieldDecomposition(dm,&nf,NULL,&fields,NULL);CHKERRQ(ierr); 168121ef3d20SStefano Zampini ierr = 
PetscMalloc1(nf,&pcbddc->ISForDofsLocal);CHKERRQ(ierr); 168221ef3d20SStefano Zampini for (i=0;i<nf;i++) { 168321ef3d20SStefano Zampini ierr = PCBDDCGlobalToLocal(matis->rctx,global,local,fields[i],&pcbddc->ISForDofsLocal[i]);CHKERRQ(ierr); 168421ef3d20SStefano Zampini ierr = ISDestroy(&fields[i]);CHKERRQ(ierr); 168521ef3d20SStefano Zampini } 168621ef3d20SStefano Zampini ierr = PetscFree(fields);CHKERRQ(ierr); 168721ef3d20SStefano Zampini pcbddc->n_ISForDofsLocal = nf; 168821ef3d20SStefano Zampini } else { /* See if MATIS has fields attached by the conversion from MatNest */ 168921ef3d20SStefano Zampini PetscContainer c; 169021ef3d20SStefano Zampini 169121ef3d20SStefano Zampini ierr = PetscObjectQuery((PetscObject)pc->pmat,"_convert_nest_lfields",(PetscObject*)&c);CHKERRQ(ierr); 169221ef3d20SStefano Zampini if (c) { 169321ef3d20SStefano Zampini MatISLocalFields lf; 169421ef3d20SStefano Zampini ierr = PetscContainerGetPointer(c,(void**)&lf);CHKERRQ(ierr); 169521ef3d20SStefano Zampini ierr = PCBDDCSetDofsSplittingLocal(pc,lf->nr,lf->rf);CHKERRQ(ierr); 169621ef3d20SStefano Zampini } else { /* fallback, create the default fields if bs > 1 */ 16971f4df5f7SStefano Zampini PetscInt i, n = matis->A->rmap->n; 1698986cdee1SStefano Zampini ierr = MatGetBlockSize(pc->pmat,&i);CHKERRQ(ierr); 169921ef3d20SStefano Zampini if (i > 1) { 1700986cdee1SStefano Zampini pcbddc->n_ISForDofsLocal = i; 17011f4df5f7SStefano Zampini ierr = PetscMalloc1(pcbddc->n_ISForDofsLocal,&pcbddc->ISForDofsLocal);CHKERRQ(ierr); 17021f4df5f7SStefano Zampini for (i=0;i<pcbddc->n_ISForDofsLocal;i++) { 17031f4df5f7SStefano Zampini ierr = ISCreateStride(PetscObjectComm((PetscObject)pc),n/pcbddc->n_ISForDofsLocal,i,pcbddc->n_ISForDofsLocal,&pcbddc->ISForDofsLocal[i]);CHKERRQ(ierr); 17041f4df5f7SStefano Zampini } 17051f4df5f7SStefano Zampini } 170621ef3d20SStefano Zampini } 170721ef3d20SStefano Zampini } 17087a0e7b2cSstefano_zampini } else { 17097a0e7b2cSstefano_zampini PetscInt i; 17107a0e7b2cSstefano_zampini 
for (i=0;i<pcbddc->n_ISForDofsLocal;i++) { 17117a0e7b2cSstefano_zampini ierr = PCBDDCConsistencyCheckIS(pc,MPI_LAND,&pcbddc->ISForDofsLocal[i]);CHKERRQ(ierr); 17127a0e7b2cSstefano_zampini } 17131f4df5f7SStefano Zampini } 1714986cdee1SStefano Zampini } 17151f4df5f7SStefano Zampini 17165c5e10d6SStefano Zampini boundary: 17171f4df5f7SStefano Zampini if (!pcbddc->DirichletBoundariesLocal && pcbddc->DirichletBoundaries) { 17181f4df5f7SStefano Zampini ierr = PCBDDCGlobalToLocal(matis->rctx,global,local,pcbddc->DirichletBoundaries,&pcbddc->DirichletBoundariesLocal);CHKERRQ(ierr); 17197a0e7b2cSstefano_zampini } else if (pcbddc->DirichletBoundariesLocal) { 17207a0e7b2cSstefano_zampini ierr = PCBDDCConsistencyCheckIS(pc,MPI_LAND,&pcbddc->DirichletBoundariesLocal);CHKERRQ(ierr); 17211f4df5f7SStefano Zampini } 17221f4df5f7SStefano Zampini if (!pcbddc->NeumannBoundariesLocal && pcbddc->NeumannBoundaries) { 17231f4df5f7SStefano Zampini ierr = PCBDDCGlobalToLocal(matis->rctx,global,local,pcbddc->NeumannBoundaries,&pcbddc->NeumannBoundariesLocal);CHKERRQ(ierr); 17247a0e7b2cSstefano_zampini } else if (pcbddc->NeumannBoundariesLocal) { 17257a0e7b2cSstefano_zampini ierr = PCBDDCConsistencyCheckIS(pc,MPI_LOR,&pcbddc->NeumannBoundariesLocal);CHKERRQ(ierr); 17261f4df5f7SStefano Zampini } 17271f4df5f7SStefano Zampini if (!pcbddc->user_primal_vertices_local && pcbddc->user_primal_vertices) { 17281f4df5f7SStefano Zampini ierr = PCBDDCGlobalToLocal(matis->rctx,global,local,pcbddc->user_primal_vertices,&pcbddc->user_primal_vertices_local);CHKERRQ(ierr); 17291f4df5f7SStefano Zampini } 17301f4df5f7SStefano Zampini ierr = VecDestroy(&global);CHKERRQ(ierr); 17311f4df5f7SStefano Zampini ierr = VecDestroy(&local);CHKERRQ(ierr); 17327a0e7b2cSstefano_zampini 17337a0e7b2cSstefano_zampini PetscFunctionReturn(0); 17347a0e7b2cSstefano_zampini } 17357a0e7b2cSstefano_zampini 17367a0e7b2cSstefano_zampini PetscErrorCode PCBDDCConsistencyCheckIS(PC pc, MPI_Op mop, IS *is) 17377a0e7b2cSstefano_zampini { 
17387a0e7b2cSstefano_zampini Mat_IS *matis = (Mat_IS*)(pc->pmat->data); 17397a0e7b2cSstefano_zampini PetscErrorCode ierr; 17407a0e7b2cSstefano_zampini IS nis; 17417a0e7b2cSstefano_zampini const PetscInt *idxs; 17427a0e7b2cSstefano_zampini PetscInt i,nd,n = matis->A->rmap->n,*nidxs,nnd; 17437a0e7b2cSstefano_zampini PetscBool *ld; 17447a0e7b2cSstefano_zampini 17457a0e7b2cSstefano_zampini PetscFunctionBegin; 17467a0e7b2cSstefano_zampini if (mop != MPI_LAND && mop != MPI_LOR) SETERRQ(PetscObjectComm((PetscObject)(pc)),PETSC_ERR_SUP,"Supported are MPI_LAND and MPI_LOR"); 17477a0e7b2cSstefano_zampini ierr = MatISSetUpSF(pc->pmat);CHKERRQ(ierr); 17487a0e7b2cSstefano_zampini if (mop == MPI_LAND) { 17497a0e7b2cSstefano_zampini /* init rootdata with true */ 17507a0e7b2cSstefano_zampini ld = (PetscBool*) matis->sf_rootdata; 17517a0e7b2cSstefano_zampini for (i=0;i<pc->pmat->rmap->n;i++) ld[i] = PETSC_TRUE; 17527a0e7b2cSstefano_zampini } else { 17537a0e7b2cSstefano_zampini ierr = PetscMemzero(matis->sf_rootdata,pc->pmat->rmap->n*sizeof(PetscBool));CHKERRQ(ierr); 17547a0e7b2cSstefano_zampini } 17557a0e7b2cSstefano_zampini ierr = PetscMemzero(matis->sf_leafdata,n*sizeof(PetscBool));CHKERRQ(ierr); 17567a0e7b2cSstefano_zampini ierr = ISGetLocalSize(*is,&nd);CHKERRQ(ierr); 17577a0e7b2cSstefano_zampini ierr = ISGetIndices(*is,&idxs);CHKERRQ(ierr); 17587a0e7b2cSstefano_zampini ld = (PetscBool*) matis->sf_leafdata; 17597a0e7b2cSstefano_zampini for (i=0;i<nd;i++) 17607a0e7b2cSstefano_zampini if (-1 < idxs[i] && idxs[i] < n) 17617a0e7b2cSstefano_zampini ld[idxs[i]] = PETSC_TRUE; 17627a0e7b2cSstefano_zampini ierr = ISRestoreIndices(*is,&idxs);CHKERRQ(ierr); 17637a0e7b2cSstefano_zampini ierr = PetscSFReduceBegin(matis->sf,MPIU_BOOL,matis->sf_leafdata,matis->sf_rootdata,mop);CHKERRQ(ierr); 17647a0e7b2cSstefano_zampini ierr = PetscSFReduceEnd(matis->sf,MPIU_BOOL,matis->sf_leafdata,matis->sf_rootdata,mop);CHKERRQ(ierr); 17657a0e7b2cSstefano_zampini ierr = 
PetscSFBcastBegin(matis->sf,MPIU_BOOL,matis->sf_rootdata,matis->sf_leafdata);CHKERRQ(ierr); 17667a0e7b2cSstefano_zampini ierr = PetscSFBcastEnd(matis->sf,MPIU_BOOL,matis->sf_rootdata,matis->sf_leafdata);CHKERRQ(ierr); 17677a0e7b2cSstefano_zampini if (mop == MPI_LAND) { 17687a0e7b2cSstefano_zampini ierr = PetscMalloc1(nd,&nidxs);CHKERRQ(ierr); 17697a0e7b2cSstefano_zampini } else { 17707a0e7b2cSstefano_zampini ierr = PetscMalloc1(n,&nidxs);CHKERRQ(ierr); 17717a0e7b2cSstefano_zampini } 17727a0e7b2cSstefano_zampini for (i=0,nnd=0;i<n;i++) 17737a0e7b2cSstefano_zampini if (ld[i]) 17747a0e7b2cSstefano_zampini nidxs[nnd++] = i; 17757a0e7b2cSstefano_zampini ierr = ISCreateGeneral(PetscObjectComm((PetscObject)(*is)),nnd,nidxs,PETSC_OWN_POINTER,&nis);CHKERRQ(ierr); 17767a0e7b2cSstefano_zampini ierr = ISDestroy(is);CHKERRQ(ierr); 17777a0e7b2cSstefano_zampini *is = nis; 17781f4df5f7SStefano Zampini PetscFunctionReturn(0); 17791f4df5f7SStefano Zampini } 17801f4df5f7SStefano Zampini 17813e589ea0SStefano Zampini PetscErrorCode PCBDDCBenignRemoveInterior(PC pc,Vec r,Vec z) 17823e589ea0SStefano Zampini { 17833e589ea0SStefano Zampini PC_IS *pcis = (PC_IS*)(pc->data); 17843e589ea0SStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)(pc->data); 17853e589ea0SStefano Zampini PetscErrorCode ierr; 17863e589ea0SStefano Zampini 17873e589ea0SStefano Zampini PetscFunctionBegin; 17883e589ea0SStefano Zampini if (!pcbddc->benign_have_null) { 17893e589ea0SStefano Zampini PetscFunctionReturn(0); 17903e589ea0SStefano Zampini } 17913e589ea0SStefano Zampini if (pcbddc->ChangeOfBasisMatrix) { 17923e589ea0SStefano Zampini Vec swap; 17933e589ea0SStefano Zampini 17943e589ea0SStefano Zampini ierr = MatMultTranspose(pcbddc->ChangeOfBasisMatrix,r,pcbddc->work_change);CHKERRQ(ierr); 17953e589ea0SStefano Zampini swap = pcbddc->work_change; 17963e589ea0SStefano Zampini pcbddc->work_change = r; 17973e589ea0SStefano Zampini r = swap; 17983e589ea0SStefano Zampini } 17993e589ea0SStefano Zampini ierr = 
VecScatterBegin(pcis->global_to_D,r,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 18003e589ea0SStefano Zampini ierr = VecScatterEnd(pcis->global_to_D,r,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 18013e589ea0SStefano Zampini ierr = KSPSolve(pcbddc->ksp_D,pcis->vec1_D,pcis->vec2_D);CHKERRQ(ierr); 18023e589ea0SStefano Zampini ierr = VecSet(z,0.);CHKERRQ(ierr); 18033e589ea0SStefano Zampini ierr = VecScatterBegin(pcis->global_to_D,pcis->vec2_D,z,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 18043e589ea0SStefano Zampini ierr = VecScatterEnd(pcis->global_to_D,pcis->vec2_D,z,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 18053e589ea0SStefano Zampini if (pcbddc->ChangeOfBasisMatrix) { 1806f913dca9SStefano Zampini pcbddc->work_change = r; 18073e589ea0SStefano Zampini ierr = VecCopy(z,pcbddc->work_change);CHKERRQ(ierr); 18083e589ea0SStefano Zampini ierr = MatMult(pcbddc->ChangeOfBasisMatrix,pcbddc->work_change,z);CHKERRQ(ierr); 18093e589ea0SStefano Zampini } 18103e589ea0SStefano Zampini PetscFunctionReturn(0); 18113e589ea0SStefano Zampini } 18123e589ea0SStefano Zampini 1813a3df083aSStefano Zampini PetscErrorCode PCBDDCBenignMatMult_Private_Private(Mat A, Vec x, Vec y, PetscBool transpose) 1814a3df083aSStefano Zampini { 1815a3df083aSStefano Zampini PCBDDCBenignMatMult_ctx ctx; 1816a3df083aSStefano Zampini PetscErrorCode ierr; 1817a3df083aSStefano Zampini PetscBool apply_right,apply_left,reset_x; 1818a3df083aSStefano Zampini 1819a3df083aSStefano Zampini PetscFunctionBegin; 1820a3df083aSStefano Zampini ierr = MatShellGetContext(A,&ctx);CHKERRQ(ierr); 1821a3df083aSStefano Zampini if (transpose) { 1822a3df083aSStefano Zampini apply_right = ctx->apply_left; 1823a3df083aSStefano Zampini apply_left = ctx->apply_right; 1824a3df083aSStefano Zampini } else { 1825a3df083aSStefano Zampini apply_right = ctx->apply_right; 1826a3df083aSStefano Zampini apply_left = ctx->apply_left; 1827a3df083aSStefano Zampini } 1828a3df083aSStefano Zampini reset_x = PETSC_FALSE; 
1829a3df083aSStefano Zampini if (apply_right) { 1830a3df083aSStefano Zampini const PetscScalar *ax; 1831a3df083aSStefano Zampini PetscInt nl,i; 1832a3df083aSStefano Zampini 1833a3df083aSStefano Zampini ierr = VecGetLocalSize(x,&nl);CHKERRQ(ierr); 1834a3df083aSStefano Zampini ierr = VecGetArrayRead(x,&ax);CHKERRQ(ierr); 1835a3df083aSStefano Zampini ierr = PetscMemcpy(ctx->work,ax,nl*sizeof(PetscScalar));CHKERRQ(ierr); 1836a3df083aSStefano Zampini ierr = VecRestoreArrayRead(x,&ax);CHKERRQ(ierr); 1837a3df083aSStefano Zampini for (i=0;i<ctx->benign_n;i++) { 1838a3df083aSStefano Zampini PetscScalar sum,val; 1839a3df083aSStefano Zampini const PetscInt *idxs; 1840a3df083aSStefano Zampini PetscInt nz,j; 1841a3df083aSStefano Zampini ierr = ISGetLocalSize(ctx->benign_zerodiag_subs[i],&nz);CHKERRQ(ierr); 1842a3df083aSStefano Zampini ierr = ISGetIndices(ctx->benign_zerodiag_subs[i],&idxs);CHKERRQ(ierr); 1843a3df083aSStefano Zampini sum = 0.; 1844a3df083aSStefano Zampini if (ctx->apply_p0) { 1845a3df083aSStefano Zampini val = ctx->work[idxs[nz-1]]; 1846a3df083aSStefano Zampini for (j=0;j<nz-1;j++) { 1847a3df083aSStefano Zampini sum += ctx->work[idxs[j]]; 1848a3df083aSStefano Zampini ctx->work[idxs[j]] += val; 1849a3df083aSStefano Zampini } 1850a3df083aSStefano Zampini } else { 1851a3df083aSStefano Zampini for (j=0;j<nz-1;j++) { 1852a3df083aSStefano Zampini sum += ctx->work[idxs[j]]; 1853a3df083aSStefano Zampini } 1854a3df083aSStefano Zampini } 1855a3df083aSStefano Zampini ctx->work[idxs[nz-1]] -= sum; 1856a3df083aSStefano Zampini ierr = ISRestoreIndices(ctx->benign_zerodiag_subs[i],&idxs);CHKERRQ(ierr); 1857a3df083aSStefano Zampini } 1858a3df083aSStefano Zampini ierr = VecPlaceArray(x,ctx->work);CHKERRQ(ierr); 1859a3df083aSStefano Zampini reset_x = PETSC_TRUE; 1860a3df083aSStefano Zampini } 1861a3df083aSStefano Zampini if (transpose) { 1862a3df083aSStefano Zampini ierr = MatMultTranspose(ctx->A,x,y);CHKERRQ(ierr); 1863a3df083aSStefano Zampini } else { 1864a3df083aSStefano 
Zampini ierr = MatMult(ctx->A,x,y);CHKERRQ(ierr); 1865a3df083aSStefano Zampini } 1866a3df083aSStefano Zampini if (reset_x) { 1867a3df083aSStefano Zampini ierr = VecResetArray(x);CHKERRQ(ierr); 1868a3df083aSStefano Zampini } 1869a3df083aSStefano Zampini if (apply_left) { 1870a3df083aSStefano Zampini PetscScalar *ay; 1871a3df083aSStefano Zampini PetscInt i; 1872a3df083aSStefano Zampini 1873a3df083aSStefano Zampini ierr = VecGetArray(y,&ay);CHKERRQ(ierr); 1874a3df083aSStefano Zampini for (i=0;i<ctx->benign_n;i++) { 1875a3df083aSStefano Zampini PetscScalar sum,val; 1876a3df083aSStefano Zampini const PetscInt *idxs; 1877a3df083aSStefano Zampini PetscInt nz,j; 1878a3df083aSStefano Zampini ierr = ISGetLocalSize(ctx->benign_zerodiag_subs[i],&nz);CHKERRQ(ierr); 1879a3df083aSStefano Zampini ierr = ISGetIndices(ctx->benign_zerodiag_subs[i],&idxs);CHKERRQ(ierr); 1880a3df083aSStefano Zampini val = -ay[idxs[nz-1]]; 1881a3df083aSStefano Zampini if (ctx->apply_p0) { 1882a3df083aSStefano Zampini sum = 0.; 1883a3df083aSStefano Zampini for (j=0;j<nz-1;j++) { 1884a3df083aSStefano Zampini sum += ay[idxs[j]]; 1885a3df083aSStefano Zampini ay[idxs[j]] += val; 1886a3df083aSStefano Zampini } 1887a3df083aSStefano Zampini ay[idxs[nz-1]] += sum; 1888a3df083aSStefano Zampini } else { 1889a3df083aSStefano Zampini for (j=0;j<nz-1;j++) { 1890a3df083aSStefano Zampini ay[idxs[j]] += val; 1891a3df083aSStefano Zampini } 1892a3df083aSStefano Zampini ay[idxs[nz-1]] = 0.; 1893a3df083aSStefano Zampini } 1894a3df083aSStefano Zampini ierr = ISRestoreIndices(ctx->benign_zerodiag_subs[i],&idxs);CHKERRQ(ierr); 1895a3df083aSStefano Zampini } 1896a3df083aSStefano Zampini ierr = VecRestoreArray(y,&ay);CHKERRQ(ierr); 1897a3df083aSStefano Zampini } 1898a3df083aSStefano Zampini PetscFunctionReturn(0); 1899a3df083aSStefano Zampini } 1900a3df083aSStefano Zampini 1901a3df083aSStefano Zampini PetscErrorCode PCBDDCBenignMatMultTranspose_Private(Mat A, Vec x, Vec y) 1902a3df083aSStefano Zampini { 1903a3df083aSStefano 
Zampini PetscErrorCode ierr; 1904a3df083aSStefano Zampini 1905a3df083aSStefano Zampini PetscFunctionBegin; 1906a3df083aSStefano Zampini ierr = PCBDDCBenignMatMult_Private_Private(A,x,y,PETSC_TRUE);CHKERRQ(ierr); 1907a3df083aSStefano Zampini PetscFunctionReturn(0); 1908a3df083aSStefano Zampini } 1909a3df083aSStefano Zampini 1910a3df083aSStefano Zampini PetscErrorCode PCBDDCBenignMatMult_Private(Mat A, Vec x, Vec y) 1911a3df083aSStefano Zampini { 1912a3df083aSStefano Zampini PetscErrorCode ierr; 1913a3df083aSStefano Zampini 1914a3df083aSStefano Zampini PetscFunctionBegin; 1915a3df083aSStefano Zampini ierr = PCBDDCBenignMatMult_Private_Private(A,x,y,PETSC_FALSE);CHKERRQ(ierr); 1916a3df083aSStefano Zampini PetscFunctionReturn(0); 1917a3df083aSStefano Zampini } 1918a3df083aSStefano Zampini 1919a3df083aSStefano Zampini PetscErrorCode PCBDDCBenignShellMat(PC pc, PetscBool restore) 1920a3df083aSStefano Zampini { 1921a3df083aSStefano Zampini PC_IS *pcis = (PC_IS*)pc->data; 1922a3df083aSStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 1923a3df083aSStefano Zampini PCBDDCBenignMatMult_ctx ctx; 1924a3df083aSStefano Zampini PetscErrorCode ierr; 1925a3df083aSStefano Zampini 1926a3df083aSStefano Zampini PetscFunctionBegin; 1927a3df083aSStefano Zampini if (!restore) { 19281dd7afcfSStefano Zampini Mat A_IB,A_BI; 1929a3df083aSStefano Zampini PetscScalar *work; 1930b334f244SStefano Zampini PCBDDCReuseSolvers reuse = pcbddc->sub_schurs ? 
pcbddc->sub_schurs->reuse_solver : NULL; 1931a3df083aSStefano Zampini 19329a962809SStefano Zampini if (pcbddc->benign_original_mat) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Benign original mat has not been restored"); 19339a962809SStefano Zampini if (!pcbddc->benign_change || !pcbddc->benign_n || pcbddc->benign_change_explicit) PetscFunctionReturn(0); 1934a3df083aSStefano Zampini ierr = PetscMalloc1(pcis->n,&work);CHKERRQ(ierr); 1935a3df083aSStefano Zampini ierr = MatCreate(PETSC_COMM_SELF,&A_IB);CHKERRQ(ierr); 1936a3df083aSStefano Zampini ierr = MatSetSizes(A_IB,pcis->n-pcis->n_B,pcis->n_B,PETSC_DECIDE,PETSC_DECIDE);CHKERRQ(ierr); 1937a3df083aSStefano Zampini ierr = MatSetType(A_IB,MATSHELL);CHKERRQ(ierr); 1938a3df083aSStefano Zampini ierr = MatShellSetOperation(A_IB,MATOP_MULT,(void (*)(void))PCBDDCBenignMatMult_Private);CHKERRQ(ierr); 1939a3df083aSStefano Zampini ierr = MatShellSetOperation(A_IB,MATOP_MULT_TRANSPOSE,(void (*)(void))PCBDDCBenignMatMultTranspose_Private);CHKERRQ(ierr); 1940a3df083aSStefano Zampini ierr = PetscNew(&ctx);CHKERRQ(ierr); 1941a3df083aSStefano Zampini ierr = MatShellSetContext(A_IB,ctx);CHKERRQ(ierr); 1942a3df083aSStefano Zampini ctx->apply_left = PETSC_TRUE; 1943a3df083aSStefano Zampini ctx->apply_right = PETSC_FALSE; 1944a3df083aSStefano Zampini ctx->apply_p0 = PETSC_FALSE; 1945a3df083aSStefano Zampini ctx->benign_n = pcbddc->benign_n; 1946059032f7SStefano Zampini if (reuse) { 1947a3df083aSStefano Zampini ctx->benign_zerodiag_subs = reuse->benign_zerodiag_subs; 19481dd7afcfSStefano Zampini ctx->free = PETSC_FALSE; 1949059032f7SStefano Zampini } else { /* TODO: could be optimized for successive solves */ 1950059032f7SStefano Zampini ISLocalToGlobalMapping N_to_D; 1951059032f7SStefano Zampini PetscInt i; 1952059032f7SStefano Zampini 1953059032f7SStefano Zampini ierr = ISLocalToGlobalMappingCreateIS(pcis->is_I_local,&N_to_D);CHKERRQ(ierr); 1954059032f7SStefano Zampini ierr = 
PetscMalloc1(pcbddc->benign_n,&ctx->benign_zerodiag_subs);CHKERRQ(ierr); 1955059032f7SStefano Zampini for (i=0;i<pcbddc->benign_n;i++) { 1956059032f7SStefano Zampini ierr = ISGlobalToLocalMappingApplyIS(N_to_D,IS_GTOLM_DROP,pcbddc->benign_zerodiag_subs[i],&ctx->benign_zerodiag_subs[i]);CHKERRQ(ierr); 1957059032f7SStefano Zampini } 1958059032f7SStefano Zampini ierr = ISLocalToGlobalMappingDestroy(&N_to_D);CHKERRQ(ierr); 19591dd7afcfSStefano Zampini ctx->free = PETSC_TRUE; 1960059032f7SStefano Zampini } 1961a3df083aSStefano Zampini ctx->A = pcis->A_IB; 1962a3df083aSStefano Zampini ctx->work = work; 1963a3df083aSStefano Zampini ierr = MatSetUp(A_IB);CHKERRQ(ierr); 1964a3df083aSStefano Zampini ierr = MatAssemblyBegin(A_IB,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 1965a3df083aSStefano Zampini ierr = MatAssemblyEnd(A_IB,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 1966a3df083aSStefano Zampini pcis->A_IB = A_IB; 1967a3df083aSStefano Zampini 1968a3df083aSStefano Zampini /* A_BI as A_IB^T */ 1969a3df083aSStefano Zampini ierr = MatCreateTranspose(A_IB,&A_BI);CHKERRQ(ierr); 1970a3df083aSStefano Zampini pcbddc->benign_original_mat = pcis->A_BI; 1971a3df083aSStefano Zampini pcis->A_BI = A_BI; 1972a3df083aSStefano Zampini } else { 19731dd7afcfSStefano Zampini if (!pcbddc->benign_original_mat) { 19741dd7afcfSStefano Zampini PetscFunctionReturn(0); 19751dd7afcfSStefano Zampini } 1976a3df083aSStefano Zampini ierr = MatShellGetContext(pcis->A_IB,&ctx);CHKERRQ(ierr); 1977a3df083aSStefano Zampini ierr = MatDestroy(&pcis->A_IB);CHKERRQ(ierr); 1978a3df083aSStefano Zampini pcis->A_IB = ctx->A; 19791dd7afcfSStefano Zampini ctx->A = NULL; 19801dd7afcfSStefano Zampini ierr = MatDestroy(&pcis->A_BI);CHKERRQ(ierr); 19811dd7afcfSStefano Zampini pcis->A_BI = pcbddc->benign_original_mat; 19821dd7afcfSStefano Zampini pcbddc->benign_original_mat = NULL; 19831dd7afcfSStefano Zampini if (ctx->free) { 1984059032f7SStefano Zampini PetscInt i; 19851dd7afcfSStefano Zampini for (i=0;i<ctx->benign_n;i++) { 
1986059032f7SStefano Zampini ierr = ISDestroy(&ctx->benign_zerodiag_subs[i]);CHKERRQ(ierr); 1987059032f7SStefano Zampini } 1988059032f7SStefano Zampini ierr = PetscFree(ctx->benign_zerodiag_subs);CHKERRQ(ierr); 1989059032f7SStefano Zampini } 1990a3df083aSStefano Zampini ierr = PetscFree(ctx->work);CHKERRQ(ierr); 1991a3df083aSStefano Zampini ierr = PetscFree(ctx);CHKERRQ(ierr); 1992a3df083aSStefano Zampini } 1993a3df083aSStefano Zampini PetscFunctionReturn(0); 1994a3df083aSStefano Zampini } 1995a3df083aSStefano Zampini 1996a3df083aSStefano Zampini /* used just in bddc debug mode */ 1997a3df083aSStefano Zampini PetscErrorCode PCBDDCBenignProject(PC pc, IS is1, IS is2, Mat *B) 1998a3df083aSStefano Zampini { 1999a3df083aSStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 2000a3df083aSStefano Zampini Mat_IS *matis = (Mat_IS*)pc->pmat->data; 2001a3df083aSStefano Zampini Mat An; 2002a3df083aSStefano Zampini PetscErrorCode ierr; 2003a3df083aSStefano Zampini 2004a3df083aSStefano Zampini PetscFunctionBegin; 2005a3df083aSStefano Zampini ierr = MatPtAP(matis->A,pcbddc->benign_change,MAT_INITIAL_MATRIX,2.0,&An);CHKERRQ(ierr); 2006a3df083aSStefano Zampini ierr = MatZeroRowsColumns(An,pcbddc->benign_n,pcbddc->benign_p0_lidx,1.0,NULL,NULL);CHKERRQ(ierr); 2007a3df083aSStefano Zampini if (is1) { 20087dae84e0SHong Zhang ierr = MatCreateSubMatrix(An,is1,is2,MAT_INITIAL_MATRIX,B);CHKERRQ(ierr); 2009a3df083aSStefano Zampini ierr = MatDestroy(&An);CHKERRQ(ierr); 2010a3df083aSStefano Zampini } else { 2011a3df083aSStefano Zampini *B = An; 2012a3df083aSStefano Zampini } 2013a3df083aSStefano Zampini PetscFunctionReturn(0); 2014a3df083aSStefano Zampini } 2015a3df083aSStefano Zampini 20161cf9b237SStefano Zampini /* TODO: add reuse flag */ 20171cf9b237SStefano Zampini PetscErrorCode MatSeqAIJCompress(Mat A, Mat *B) 20181cf9b237SStefano Zampini { 20191cf9b237SStefano Zampini Mat Bt; 20201cf9b237SStefano Zampini PetscScalar *a,*bdata; 20211cf9b237SStefano Zampini const PetscInt *ii,*ij; 
20221cf9b237SStefano Zampini PetscInt m,n,i,nnz,*bii,*bij; 20231cf9b237SStefano Zampini PetscBool flg_row; 20241cf9b237SStefano Zampini PetscErrorCode ierr; 20251cf9b237SStefano Zampini 20261cf9b237SStefano Zampini PetscFunctionBegin; 20271cf9b237SStefano Zampini ierr = MatGetSize(A,&n,&m);CHKERRQ(ierr); 20281cf9b237SStefano Zampini ierr = MatGetRowIJ(A,0,PETSC_FALSE,PETSC_FALSE,&n,&ii,&ij,&flg_row);CHKERRQ(ierr); 20291cf9b237SStefano Zampini ierr = MatSeqAIJGetArray(A,&a);CHKERRQ(ierr); 20301cf9b237SStefano Zampini nnz = n; 20311cf9b237SStefano Zampini for (i=0;i<ii[n];i++) { 20321cf9b237SStefano Zampini if (PetscLikely(PetscAbsScalar(a[i]) > PETSC_SMALL)) nnz++; 20331cf9b237SStefano Zampini } 20341cf9b237SStefano Zampini ierr = PetscMalloc1(n+1,&bii);CHKERRQ(ierr); 20351cf9b237SStefano Zampini ierr = PetscMalloc1(nnz,&bij);CHKERRQ(ierr); 20361cf9b237SStefano Zampini ierr = PetscMalloc1(nnz,&bdata);CHKERRQ(ierr); 20371cf9b237SStefano Zampini nnz = 0; 20381cf9b237SStefano Zampini bii[0] = 0; 20391cf9b237SStefano Zampini for (i=0;i<n;i++) { 20401cf9b237SStefano Zampini PetscInt j; 20411cf9b237SStefano Zampini for (j=ii[i];j<ii[i+1];j++) { 20421cf9b237SStefano Zampini PetscScalar entry = a[j]; 20431cf9b237SStefano Zampini if (PetscLikely(PetscAbsScalar(entry) > PETSC_SMALL) || ij[j] == i) { 20441cf9b237SStefano Zampini bij[nnz] = ij[j]; 20451cf9b237SStefano Zampini bdata[nnz] = entry; 20461cf9b237SStefano Zampini nnz++; 20471cf9b237SStefano Zampini } 20481cf9b237SStefano Zampini } 20491cf9b237SStefano Zampini bii[i+1] = nnz; 20501cf9b237SStefano Zampini } 20511cf9b237SStefano Zampini ierr = MatSeqAIJRestoreArray(A,&a);CHKERRQ(ierr); 20521cf9b237SStefano Zampini ierr = MatCreateSeqAIJWithArrays(PetscObjectComm((PetscObject)A),n,m,bii,bij,bdata,&Bt);CHKERRQ(ierr); 20531cf9b237SStefano Zampini ierr = MatRestoreRowIJ(A,0,PETSC_FALSE,PETSC_FALSE,&n,&ii,&ij,&flg_row);CHKERRQ(ierr); 20541cf9b237SStefano Zampini { 20551cf9b237SStefano Zampini Mat_SeqAIJ *b = 
(Mat_SeqAIJ*)(Bt->data); 20561cf9b237SStefano Zampini b->free_a = PETSC_TRUE; 20571cf9b237SStefano Zampini b->free_ij = PETSC_TRUE; 20581cf9b237SStefano Zampini } 20591cf9b237SStefano Zampini *B = Bt; 20601cf9b237SStefano Zampini PetscFunctionReturn(0); 20611cf9b237SStefano Zampini } 20621cf9b237SStefano Zampini 2063c80a6c00SStefano Zampini PetscErrorCode PCBDDCDetectDisconnectedComponents(PC pc, PetscInt *ncc, IS* cc[], IS* primalv) 20644f1b2e48SStefano Zampini { 2065c80a6c00SStefano Zampini Mat B = NULL; 2066c80a6c00SStefano Zampini DM dm; 20674f1b2e48SStefano Zampini IS is_dummy,*cc_n; 20684f1b2e48SStefano Zampini ISLocalToGlobalMapping l2gmap_dummy; 20694f1b2e48SStefano Zampini PCBDDCGraph graph; 2070c80a6c00SStefano Zampini PetscInt *xadj_filtered = NULL,*adjncy_filtered = NULL; 20714f1b2e48SStefano Zampini PetscInt i,n; 20724f1b2e48SStefano Zampini PetscInt *xadj,*adjncy; 2073c80a6c00SStefano Zampini PetscBool isplex = PETSC_FALSE; 20744f1b2e48SStefano Zampini PetscErrorCode ierr; 20754f1b2e48SStefano Zampini 20764f1b2e48SStefano Zampini PetscFunctionBegin; 2077c80a6c00SStefano Zampini ierr = PCBDDCGraphCreate(&graph);CHKERRQ(ierr); 2078c80a6c00SStefano Zampini ierr = PCGetDM(pc,&dm);CHKERRQ(ierr); 2079c80a6c00SStefano Zampini if (!dm) { 2080c80a6c00SStefano Zampini ierr = MatGetDM(pc->pmat,&dm);CHKERRQ(ierr); 2081c80a6c00SStefano Zampini } 2082c80a6c00SStefano Zampini if (dm) { 2083c80a6c00SStefano Zampini ierr = PetscObjectTypeCompare((PetscObject)dm,DMPLEX,&isplex);CHKERRQ(ierr); 2084c80a6c00SStefano Zampini } 2085c80a6c00SStefano Zampini if (isplex) { /* this code has been modified from plexpartition.c */ 2086c80a6c00SStefano Zampini PetscInt p, pStart, pEnd, a, adjSize, idx, size, nroots; 2087c80a6c00SStefano Zampini PetscInt *adj = NULL; 2088c80a6c00SStefano Zampini IS cellNumbering; 2089c80a6c00SStefano Zampini const PetscInt *cellNum; 2090c80a6c00SStefano Zampini PetscBool useCone, useClosure; 2091c80a6c00SStefano Zampini PetscSection section; 
2092c80a6c00SStefano Zampini PetscSegBuffer adjBuffer; 2093c80a6c00SStefano Zampini PetscSF sfPoint; 2094c80a6c00SStefano Zampini PetscErrorCode ierr; 2095c80a6c00SStefano Zampini 2096c80a6c00SStefano Zampini PetscFunctionBegin; 2097c80a6c00SStefano Zampini ierr = DMPlexGetHeightStratum(dm, 0, &pStart, &pEnd);CHKERRQ(ierr); 2098c80a6c00SStefano Zampini ierr = DMGetPointSF(dm, &sfPoint);CHKERRQ(ierr); 2099c80a6c00SStefano Zampini ierr = PetscSFGetGraph(sfPoint, &nroots, NULL, NULL, NULL);CHKERRQ(ierr); 2100c80a6c00SStefano Zampini /* Build adjacency graph via a section/segbuffer */ 2101c80a6c00SStefano Zampini ierr = PetscSectionCreate(PetscObjectComm((PetscObject) dm), §ion);CHKERRQ(ierr); 2102c80a6c00SStefano Zampini ierr = PetscSectionSetChart(section, pStart, pEnd);CHKERRQ(ierr); 2103c80a6c00SStefano Zampini ierr = PetscSegBufferCreate(sizeof(PetscInt),1000,&adjBuffer);CHKERRQ(ierr); 2104c80a6c00SStefano Zampini /* Always use FVM adjacency to create partitioner graph */ 2105c80a6c00SStefano Zampini ierr = DMPlexGetAdjacencyUseCone(dm, &useCone);CHKERRQ(ierr); 2106c80a6c00SStefano Zampini ierr = DMPlexGetAdjacencyUseClosure(dm, &useClosure);CHKERRQ(ierr); 2107c80a6c00SStefano Zampini ierr = DMPlexSetAdjacencyUseCone(dm, PETSC_TRUE);CHKERRQ(ierr); 2108c80a6c00SStefano Zampini ierr = DMPlexSetAdjacencyUseClosure(dm, PETSC_FALSE);CHKERRQ(ierr); 2109956e2312SStefano Zampini ierr = DMPlexGetCellNumbering(dm, &cellNumbering);CHKERRQ(ierr); 2110c80a6c00SStefano Zampini ierr = ISGetIndices(cellNumbering, &cellNum);CHKERRQ(ierr); 2111c80a6c00SStefano Zampini for (n = 0, p = pStart; p < pEnd; p++) { 2112c80a6c00SStefano Zampini /* Skip non-owned cells in parallel (ParMetis expects no overlap) */ 2113c80a6c00SStefano Zampini if (nroots > 0) {if (cellNum[p] < 0) continue;} 2114c80a6c00SStefano Zampini adjSize = PETSC_DETERMINE; 2115c80a6c00SStefano Zampini ierr = DMPlexGetAdjacency(dm, p, &adjSize, &adj);CHKERRQ(ierr); 2116c80a6c00SStefano Zampini for (a = 0; a < adjSize; 
++a) { 2117c80a6c00SStefano Zampini const PetscInt point = adj[a]; 21185cef3d0dSStefano Zampini if (pStart <= point && point < pEnd) { 2119c80a6c00SStefano Zampini PetscInt *PETSC_RESTRICT pBuf; 2120c80a6c00SStefano Zampini ierr = PetscSectionAddDof(section, p, 1);CHKERRQ(ierr); 2121c80a6c00SStefano Zampini ierr = PetscSegBufferGetInts(adjBuffer, 1, &pBuf);CHKERRQ(ierr); 2122c80a6c00SStefano Zampini *pBuf = point; 2123c80a6c00SStefano Zampini } 2124c80a6c00SStefano Zampini } 2125c80a6c00SStefano Zampini n++; 2126c80a6c00SStefano Zampini } 2127c80a6c00SStefano Zampini ierr = DMPlexSetAdjacencyUseCone(dm, useCone);CHKERRQ(ierr); 2128c80a6c00SStefano Zampini ierr = DMPlexSetAdjacencyUseClosure(dm, useClosure);CHKERRQ(ierr); 2129c80a6c00SStefano Zampini /* Derive CSR graph from section/segbuffer */ 2130c80a6c00SStefano Zampini ierr = PetscSectionSetUp(section);CHKERRQ(ierr); 2131c80a6c00SStefano Zampini ierr = PetscSectionGetStorageSize(section, &size);CHKERRQ(ierr); 2132c80a6c00SStefano Zampini ierr = PetscMalloc1(n+1, &xadj);CHKERRQ(ierr); 2133c80a6c00SStefano Zampini for (idx = 0, p = pStart; p < pEnd; p++) { 2134c80a6c00SStefano Zampini if (nroots > 0) {if (cellNum[p] < 0) continue;} 2135c80a6c00SStefano Zampini ierr = PetscSectionGetOffset(section, p, &(xadj[idx++]));CHKERRQ(ierr); 2136c80a6c00SStefano Zampini } 2137c80a6c00SStefano Zampini xadj[n] = size; 2138c80a6c00SStefano Zampini ierr = PetscSegBufferExtractAlloc(adjBuffer, &adjncy);CHKERRQ(ierr); 2139c80a6c00SStefano Zampini /* Clean up */ 2140c80a6c00SStefano Zampini ierr = PetscSegBufferDestroy(&adjBuffer);CHKERRQ(ierr); 2141c80a6c00SStefano Zampini ierr = PetscSectionDestroy(§ion);CHKERRQ(ierr); 2142c80a6c00SStefano Zampini ierr = PetscFree(adj);CHKERRQ(ierr); 2143c80a6c00SStefano Zampini graph->xadj = xadj; 2144c80a6c00SStefano Zampini graph->adjncy = adjncy; 2145c80a6c00SStefano Zampini } else { 2146c80a6c00SStefano Zampini Mat A; 2147c80a6c00SStefano Zampini PetscBool filter = PETSC_FALSE, isseqaij, 
flg_row; 2148c80a6c00SStefano Zampini 2149c80a6c00SStefano Zampini ierr = MatISGetLocalMat(pc->pmat,&A);CHKERRQ(ierr); 215063c961adSStefano Zampini if (!A->rmap->N || !A->cmap->N) { 215163c961adSStefano Zampini *ncc = 0; 215263c961adSStefano Zampini *cc = NULL; 215363c961adSStefano Zampini PetscFunctionReturn(0); 215463c961adSStefano Zampini } 21554f1b2e48SStefano Zampini ierr = PetscObjectTypeCompare((PetscObject)A,MATSEQAIJ,&isseqaij);CHKERRQ(ierr); 21564f1b2e48SStefano Zampini if (!isseqaij && filter) { 21571cf9b237SStefano Zampini PetscBool isseqdense; 21581cf9b237SStefano Zampini 21591cf9b237SStefano Zampini ierr = PetscObjectTypeCompare((PetscObject)A,MATSEQDENSE,&isseqdense);CHKERRQ(ierr); 21601cf9b237SStefano Zampini if (!isseqdense) { 21614f1b2e48SStefano Zampini ierr = MatConvert(A,MATSEQAIJ,MAT_INITIAL_MATRIX,&B);CHKERRQ(ierr); 21621cf9b237SStefano Zampini } else { /* TODO: rectangular case and LDA */ 21631cf9b237SStefano Zampini PetscScalar *array; 21641cf9b237SStefano Zampini PetscReal chop=1.e-6; 21651cf9b237SStefano Zampini 21661cf9b237SStefano Zampini ierr = MatDuplicate(A,MAT_COPY_VALUES,&B);CHKERRQ(ierr); 21671cf9b237SStefano Zampini ierr = MatDenseGetArray(B,&array);CHKERRQ(ierr); 21681cf9b237SStefano Zampini ierr = MatGetSize(B,&n,NULL);CHKERRQ(ierr); 21691cf9b237SStefano Zampini for (i=0;i<n;i++) { 21701cf9b237SStefano Zampini PetscInt j; 21711cf9b237SStefano Zampini for (j=i+1;j<n;j++) { 21721cf9b237SStefano Zampini PetscReal thresh = chop*(PetscAbsScalar(array[i*(n+1)])+PetscAbsScalar(array[j*(n+1)])); 21731cf9b237SStefano Zampini if (PetscAbsScalar(array[i*n+j]) < thresh) array[i*n+j] = 0.; 21741cf9b237SStefano Zampini if (PetscAbsScalar(array[j*n+i]) < thresh) array[j*n+i] = 0.; 21751cf9b237SStefano Zampini } 21761cf9b237SStefano Zampini } 21771cf9b237SStefano Zampini ierr = MatDenseRestoreArray(B,&array);CHKERRQ(ierr); 21789d54b7f4SStefano Zampini ierr = MatConvert(B,MATSEQAIJ,MAT_INPLACE_MATRIX,&B);CHKERRQ(ierr); 21791cf9b237SStefano 
Zampini } 21804f1b2e48SStefano Zampini } else { 2181c80a6c00SStefano Zampini ierr = PetscObjectReference((PetscObject)A);CHKERRQ(ierr); 21824f1b2e48SStefano Zampini B = A; 21834f1b2e48SStefano Zampini } 21844f1b2e48SStefano Zampini ierr = MatGetRowIJ(B,0,PETSC_TRUE,PETSC_FALSE,&n,(const PetscInt**)&xadj,(const PetscInt**)&adjncy,&flg_row);CHKERRQ(ierr); 21854f1b2e48SStefano Zampini 21864f1b2e48SStefano Zampini /* if filter is true, then removes entries lower than PETSC_SMALL in magnitude */ 21874f1b2e48SStefano Zampini if (filter) { 21884f1b2e48SStefano Zampini PetscScalar *data; 21894f1b2e48SStefano Zampini PetscInt j,cum; 21904f1b2e48SStefano Zampini 21914f1b2e48SStefano Zampini ierr = PetscCalloc2(n+1,&xadj_filtered,xadj[n],&adjncy_filtered);CHKERRQ(ierr); 21924f1b2e48SStefano Zampini ierr = MatSeqAIJGetArray(B,&data);CHKERRQ(ierr); 21934f1b2e48SStefano Zampini cum = 0; 21944f1b2e48SStefano Zampini for (i=0;i<n;i++) { 21954f1b2e48SStefano Zampini PetscInt t; 21964f1b2e48SStefano Zampini 21974f1b2e48SStefano Zampini for (j=xadj[i];j<xadj[i+1];j++) { 21984f1b2e48SStefano Zampini if (PetscUnlikely(PetscAbsScalar(data[j]) < PETSC_SMALL)) { 21994f1b2e48SStefano Zampini continue; 22004f1b2e48SStefano Zampini } 22014f1b2e48SStefano Zampini adjncy_filtered[cum+xadj_filtered[i]++] = adjncy[j]; 22024f1b2e48SStefano Zampini } 22034f1b2e48SStefano Zampini t = xadj_filtered[i]; 22044f1b2e48SStefano Zampini xadj_filtered[i] = cum; 22054f1b2e48SStefano Zampini cum += t; 22064f1b2e48SStefano Zampini } 22074f1b2e48SStefano Zampini ierr = MatSeqAIJRestoreArray(B,&data);CHKERRQ(ierr); 22084f1b2e48SStefano Zampini graph->xadj = xadj_filtered; 22094f1b2e48SStefano Zampini graph->adjncy = adjncy_filtered; 22104f1b2e48SStefano Zampini } else { 22114f1b2e48SStefano Zampini graph->xadj = xadj; 22124f1b2e48SStefano Zampini graph->adjncy = adjncy; 22134f1b2e48SStefano Zampini } 2214c80a6c00SStefano Zampini } 2215c80a6c00SStefano Zampini /* compute local connected components using 
PCBDDCGraph */ 2216c80a6c00SStefano Zampini ierr = ISCreateStride(PETSC_COMM_SELF,n,0,1,&is_dummy);CHKERRQ(ierr); 2217c80a6c00SStefano Zampini ierr = ISLocalToGlobalMappingCreateIS(is_dummy,&l2gmap_dummy);CHKERRQ(ierr); 2218c80a6c00SStefano Zampini ierr = ISDestroy(&is_dummy);CHKERRQ(ierr); 2219c80a6c00SStefano Zampini ierr = PCBDDCGraphInit(graph,l2gmap_dummy,n,PETSC_MAX_INT);CHKERRQ(ierr); 2220c80a6c00SStefano Zampini ierr = ISLocalToGlobalMappingDestroy(&l2gmap_dummy);CHKERRQ(ierr); 22214f1b2e48SStefano Zampini ierr = PCBDDCGraphSetUp(graph,1,NULL,NULL,0,NULL,NULL);CHKERRQ(ierr); 22224f1b2e48SStefano Zampini ierr = PCBDDCGraphComputeConnectedComponents(graph);CHKERRQ(ierr); 2223c80a6c00SStefano Zampini 22244f1b2e48SStefano Zampini /* partial clean up */ 22254f1b2e48SStefano Zampini ierr = PetscFree2(xadj_filtered,adjncy_filtered);CHKERRQ(ierr); 2226c80a6c00SStefano Zampini if (B) { 2227c80a6c00SStefano Zampini PetscBool flg_row; 22284f1b2e48SStefano Zampini ierr = MatRestoreRowIJ(B,0,PETSC_TRUE,PETSC_FALSE,&n,(const PetscInt**)&xadj,(const PetscInt**)&adjncy,&flg_row);CHKERRQ(ierr); 22294f1b2e48SStefano Zampini ierr = MatDestroy(&B);CHKERRQ(ierr); 22304f1b2e48SStefano Zampini } 2231c80a6c00SStefano Zampini if (isplex) { 2232c80a6c00SStefano Zampini ierr = PetscFree(xadj);CHKERRQ(ierr); 2233c80a6c00SStefano Zampini ierr = PetscFree(adjncy);CHKERRQ(ierr); 2234c80a6c00SStefano Zampini } 22354f1b2e48SStefano Zampini 22364f1b2e48SStefano Zampini /* get back data */ 2237c80a6c00SStefano Zampini if (isplex) { 2238c80a6c00SStefano Zampini if (ncc) *ncc = graph->ncc; 2239c80a6c00SStefano Zampini if (cc || primalv) { 2240c80a6c00SStefano Zampini Mat A; 2241c80a6c00SStefano Zampini PetscBT btv,btvt; 2242c80a6c00SStefano Zampini PetscSection subSection; 2243c80a6c00SStefano Zampini PetscInt *ids,cum,cump,*cids,*pids; 2244c80a6c00SStefano Zampini 2245c80a6c00SStefano Zampini ierr = DMPlexGetSubdomainSection(dm,&subSection);CHKERRQ(ierr); 2246c80a6c00SStefano Zampini ierr = 
MatISGetLocalMat(pc->pmat,&A);CHKERRQ(ierr); 2247c80a6c00SStefano Zampini ierr = PetscMalloc3(A->rmap->n,&ids,graph->ncc+1,&cids,A->rmap->n,&pids);CHKERRQ(ierr); 2248c80a6c00SStefano Zampini ierr = PetscBTCreate(A->rmap->n,&btv);CHKERRQ(ierr); 2249c80a6c00SStefano Zampini ierr = PetscBTCreate(A->rmap->n,&btvt);CHKERRQ(ierr); 2250c80a6c00SStefano Zampini 2251c80a6c00SStefano Zampini cids[0] = 0; 2252c80a6c00SStefano Zampini for (i = 0, cump = 0, cum = 0; i < graph->ncc; i++) { 2253c80a6c00SStefano Zampini PetscInt j; 2254c80a6c00SStefano Zampini 2255c80a6c00SStefano Zampini ierr = PetscBTMemzero(A->rmap->n,btvt);CHKERRQ(ierr); 2256c80a6c00SStefano Zampini for (j = graph->cptr[i]; j < graph->cptr[i+1]; j++) { 2257c80a6c00SStefano Zampini PetscInt k, size, *closure = NULL, cell = graph->queue[j]; 2258c80a6c00SStefano Zampini 2259c80a6c00SStefano Zampini ierr = DMPlexGetTransitiveClosure(dm,cell,PETSC_TRUE,&size,&closure);CHKERRQ(ierr); 2260c80a6c00SStefano Zampini for (k = 0; k < 2*size; k += 2) { 2261c80a6c00SStefano Zampini PetscInt s, p = closure[k], off, dof, cdof; 2262c80a6c00SStefano Zampini 2263c80a6c00SStefano Zampini ierr = PetscSectionGetConstraintDof(subSection, p, &cdof);CHKERRQ(ierr); 2264c80a6c00SStefano Zampini ierr = PetscSectionGetOffset(subSection,p,&off);CHKERRQ(ierr); 2265c80a6c00SStefano Zampini ierr = PetscSectionGetDof(subSection,p,&dof);CHKERRQ(ierr); 2266c80a6c00SStefano Zampini for (s = 0; s < dof-cdof; s++) { 2267c80a6c00SStefano Zampini if (PetscBTLookupSet(btvt,off+s)) continue; 2268c80a6c00SStefano Zampini if (!PetscBTLookup(btv,off+s)) { 2269c80a6c00SStefano Zampini ids[cum++] = off+s; 2270c80a6c00SStefano Zampini } else { /* cross-vertex */ 2271c80a6c00SStefano Zampini pids[cump++] = off+s; 2272c80a6c00SStefano Zampini } 2273c80a6c00SStefano Zampini } 2274c80a6c00SStefano Zampini } 2275c80a6c00SStefano Zampini ierr = DMPlexRestoreTransitiveClosure(dm,cell,PETSC_TRUE,&size,&closure);CHKERRQ(ierr); 2276c80a6c00SStefano Zampini } 
2277c80a6c00SStefano Zampini cids[i+1] = cum; 2278c80a6c00SStefano Zampini /* mark dofs as already assigned */ 2279c80a6c00SStefano Zampini for (j = cids[i]; j < cids[i+1]; j++) { 2280c80a6c00SStefano Zampini ierr = PetscBTSet(btv,ids[j]);CHKERRQ(ierr); 2281c80a6c00SStefano Zampini } 2282c80a6c00SStefano Zampini } 2283c80a6c00SStefano Zampini if (cc) { 2284c80a6c00SStefano Zampini ierr = PetscMalloc1(graph->ncc,&cc_n);CHKERRQ(ierr); 2285c80a6c00SStefano Zampini for (i = 0; i < graph->ncc; i++) { 2286c80a6c00SStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,cids[i+1]-cids[i],ids+cids[i],PETSC_COPY_VALUES,&cc_n[i]);CHKERRQ(ierr); 2287c80a6c00SStefano Zampini } 2288c80a6c00SStefano Zampini *cc = cc_n; 2289c80a6c00SStefano Zampini } 2290c80a6c00SStefano Zampini if (primalv) { 2291c80a6c00SStefano Zampini ierr = ISCreateGeneral(PetscObjectComm((PetscObject)pc),cump,pids,PETSC_COPY_VALUES,primalv);CHKERRQ(ierr); 2292c80a6c00SStefano Zampini } 2293c80a6c00SStefano Zampini ierr = PetscFree3(ids,cids,pids);CHKERRQ(ierr); 2294c80a6c00SStefano Zampini ierr = PetscBTDestroy(&btv);CHKERRQ(ierr); 2295c80a6c00SStefano Zampini ierr = PetscBTDestroy(&btvt);CHKERRQ(ierr); 2296c80a6c00SStefano Zampini } 2297c80a6c00SStefano Zampini } else { 22981cf9b237SStefano Zampini if (ncc) *ncc = graph->ncc; 22991cf9b237SStefano Zampini if (cc) { 23004f1b2e48SStefano Zampini ierr = PetscMalloc1(graph->ncc,&cc_n);CHKERRQ(ierr); 23014f1b2e48SStefano Zampini for (i=0;i<graph->ncc;i++) { 23024f1b2e48SStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,graph->cptr[i+1]-graph->cptr[i],graph->queue+graph->cptr[i],PETSC_COPY_VALUES,&cc_n[i]);CHKERRQ(ierr); 23034f1b2e48SStefano Zampini } 23044f1b2e48SStefano Zampini *cc = cc_n; 23051cf9b237SStefano Zampini } 2306c80a6c00SStefano Zampini if (primalv) *primalv = NULL; 2307c80a6c00SStefano Zampini } 23084f1b2e48SStefano Zampini /* clean up graph */ 23094f1b2e48SStefano Zampini graph->xadj = 0; 23104f1b2e48SStefano Zampini graph->adjncy = 0; 
23114f1b2e48SStefano Zampini ierr = PCBDDCGraphDestroy(&graph);CHKERRQ(ierr); 23124f1b2e48SStefano Zampini PetscFunctionReturn(0); 23134f1b2e48SStefano Zampini } 23144f1b2e48SStefano Zampini 23155408967cSStefano Zampini PetscErrorCode PCBDDCBenignCheck(PC pc, IS zerodiag) 23165408967cSStefano Zampini { 23175408967cSStefano Zampini PC_BDDC* pcbddc = (PC_BDDC*)pc->data; 23185408967cSStefano Zampini PC_IS* pcis = (PC_IS*)(pc->data); 2319dee84bffSStefano Zampini IS dirIS = NULL; 23204f1b2e48SStefano Zampini PetscInt i; 23215408967cSStefano Zampini PetscErrorCode ierr; 23225408967cSStefano Zampini 23235408967cSStefano Zampini PetscFunctionBegin; 2324dee84bffSStefano Zampini ierr = PCBDDCGraphGetDirichletDofs(pcbddc->mat_graph,&dirIS);CHKERRQ(ierr); 23255408967cSStefano Zampini if (zerodiag) { 23265408967cSStefano Zampini Mat A; 23275408967cSStefano Zampini Vec vec3_N; 23285408967cSStefano Zampini PetscScalar *vals; 23295408967cSStefano Zampini const PetscInt *idxs; 2330d12d3064SStefano Zampini PetscInt nz,*count; 23315408967cSStefano Zampini 23325408967cSStefano Zampini /* p0 */ 23335408967cSStefano Zampini ierr = VecSet(pcis->vec1_N,0.);CHKERRQ(ierr); 23345408967cSStefano Zampini ierr = PetscMalloc1(pcis->n,&vals);CHKERRQ(ierr); 23355408967cSStefano Zampini ierr = ISGetLocalSize(zerodiag,&nz);CHKERRQ(ierr); 23365408967cSStefano Zampini ierr = ISGetIndices(zerodiag,&idxs);CHKERRQ(ierr); 23374f1b2e48SStefano Zampini for (i=0;i<nz;i++) vals[i] = 1.; 23385408967cSStefano Zampini ierr = VecSetValues(pcis->vec1_N,nz,idxs,vals,INSERT_VALUES);CHKERRQ(ierr); 23395408967cSStefano Zampini ierr = VecAssemblyBegin(pcis->vec1_N);CHKERRQ(ierr); 23405408967cSStefano Zampini ierr = VecAssemblyEnd(pcis->vec1_N);CHKERRQ(ierr); 23415408967cSStefano Zampini /* v_I */ 23425408967cSStefano Zampini ierr = VecSetRandom(pcis->vec2_N,NULL);CHKERRQ(ierr); 23435408967cSStefano Zampini for (i=0;i<nz;i++) vals[i] = 0.; 23445408967cSStefano Zampini ierr = 
VecSetValues(pcis->vec2_N,nz,idxs,vals,INSERT_VALUES);CHKERRQ(ierr); 23455408967cSStefano Zampini ierr = ISRestoreIndices(zerodiag,&idxs);CHKERRQ(ierr); 23465408967cSStefano Zampini ierr = ISGetIndices(pcis->is_B_local,&idxs);CHKERRQ(ierr); 23475408967cSStefano Zampini for (i=0;i<pcis->n_B;i++) vals[i] = 0.; 23485408967cSStefano Zampini ierr = VecSetValues(pcis->vec2_N,pcis->n_B,idxs,vals,INSERT_VALUES);CHKERRQ(ierr); 23495408967cSStefano Zampini ierr = ISRestoreIndices(pcis->is_B_local,&idxs);CHKERRQ(ierr); 23505408967cSStefano Zampini if (dirIS) { 23515408967cSStefano Zampini PetscInt n; 23525408967cSStefano Zampini 23535408967cSStefano Zampini ierr = ISGetLocalSize(dirIS,&n);CHKERRQ(ierr); 23545408967cSStefano Zampini ierr = ISGetIndices(dirIS,&idxs);CHKERRQ(ierr); 23555408967cSStefano Zampini for (i=0;i<n;i++) vals[i] = 0.; 23565408967cSStefano Zampini ierr = VecSetValues(pcis->vec2_N,n,idxs,vals,INSERT_VALUES);CHKERRQ(ierr); 23575408967cSStefano Zampini ierr = ISRestoreIndices(dirIS,&idxs);CHKERRQ(ierr); 23585408967cSStefano Zampini } 23595408967cSStefano Zampini ierr = VecAssemblyBegin(pcis->vec2_N);CHKERRQ(ierr); 23605408967cSStefano Zampini ierr = VecAssemblyEnd(pcis->vec2_N);CHKERRQ(ierr); 23615408967cSStefano Zampini ierr = VecDuplicate(pcis->vec1_N,&vec3_N);CHKERRQ(ierr); 23625408967cSStefano Zampini ierr = VecSet(vec3_N,0.);CHKERRQ(ierr); 2363669cc0f4SStefano Zampini ierr = MatISGetLocalMat(pc->pmat,&A);CHKERRQ(ierr); 23645408967cSStefano Zampini ierr = MatMult(A,pcis->vec1_N,vec3_N);CHKERRQ(ierr); 23655408967cSStefano Zampini ierr = VecDot(vec3_N,pcis->vec2_N,&vals[0]);CHKERRQ(ierr); 23669a962809SStefano Zampini if (PetscAbsScalar(vals[0]) > 1.e-1) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_SUP,"Benign trick can not be applied! 
b(v_I,p_0) = %1.6e (should be numerically 0.)",PetscAbsScalar(vals[0])); 23675408967cSStefano Zampini ierr = PetscFree(vals);CHKERRQ(ierr); 23685408967cSStefano Zampini ierr = VecDestroy(&vec3_N);CHKERRQ(ierr); 2369d12d3064SStefano Zampini 2370d12d3064SStefano Zampini /* there should not be any pressure dofs lying on the interface */ 2371d12d3064SStefano Zampini ierr = PetscCalloc1(pcis->n,&count);CHKERRQ(ierr); 2372d12d3064SStefano Zampini ierr = ISGetIndices(pcis->is_B_local,&idxs);CHKERRQ(ierr); 2373d12d3064SStefano Zampini for (i=0;i<pcis->n_B;i++) count[idxs[i]]++; 2374d12d3064SStefano Zampini ierr = ISRestoreIndices(pcis->is_B_local,&idxs);CHKERRQ(ierr); 2375d12d3064SStefano Zampini ierr = ISGetIndices(zerodiag,&idxs);CHKERRQ(ierr); 23769a962809SStefano Zampini for (i=0;i<nz;i++) if (count[idxs[i]]) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_SUP,"Benign trick can not be applied! pressure dof %d is an interface dof",idxs[i]); 2377d12d3064SStefano Zampini ierr = ISRestoreIndices(zerodiag,&idxs);CHKERRQ(ierr); 2378d12d3064SStefano Zampini ierr = PetscFree(count);CHKERRQ(ierr); 23795408967cSStefano Zampini } 2380dee84bffSStefano Zampini ierr = ISDestroy(&dirIS);CHKERRQ(ierr); 23815408967cSStefano Zampini 23825408967cSStefano Zampini /* check PCBDDCBenignGetOrSetP0 */ 23835408967cSStefano Zampini ierr = VecSetRandom(pcis->vec1_global,NULL);CHKERRQ(ierr); 23844f1b2e48SStefano Zampini for (i=0;i<pcbddc->benign_n;i++) pcbddc->benign_p0[i] = -PetscGlobalRank-i; 23855408967cSStefano Zampini ierr = PCBDDCBenignGetOrSetP0(pc,pcis->vec1_global,PETSC_FALSE);CHKERRQ(ierr); 23864f1b2e48SStefano Zampini for (i=0;i<pcbddc->benign_n;i++) pcbddc->benign_p0[i] = 1; 23875408967cSStefano Zampini ierr = PCBDDCBenignGetOrSetP0(pc,pcis->vec1_global,PETSC_TRUE);CHKERRQ(ierr); 2388f2a566d8SStefano Zampini for (i=0;i<pcbddc->benign_n;i++) { 2389f2a566d8SStefano Zampini PetscInt val = PetscRealPart(pcbddc->benign_p0[i]); 2390f2a566d8SStefano Zampini if (val != -PetscGlobalRank-i) 
SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Error testing PCBDDCBenignGetOrSetP0! Found %g at %d instead of %g\n",PetscRealPart(pcbddc->benign_p0[i]),i,-PetscGlobalRank-i);CHKERRQ(ierr); 2391f2a566d8SStefano Zampini } 23925408967cSStefano Zampini PetscFunctionReturn(0); 23935408967cSStefano Zampini } 23945408967cSStefano Zampini 2395339f8db1SStefano Zampini PetscErrorCode PCBDDCBenignDetectSaddlePoint(PC pc, IS *zerodiaglocal) 2396339f8db1SStefano Zampini { 2397339f8db1SStefano Zampini PC_BDDC* pcbddc = (PC_BDDC*)pc->data; 23984edc6404Sstefano_zampini IS pressures,zerodiag,zerodiag_save,*zerodiag_subs; 2399b0f5fe93SStefano Zampini PetscInt nz,n; 24004edc6404Sstefano_zampini PetscInt *interior_dofs,n_interior_dofs,nneu; 24014edc6404Sstefano_zampini PetscBool sorted,have_null,has_null_pressures,recompute_zerodiag,checkb; 2402339f8db1SStefano Zampini PetscErrorCode ierr; 2403339f8db1SStefano Zampini 2404339f8db1SStefano Zampini PetscFunctionBegin; 24059f47a83aSStefano Zampini ierr = PetscSFDestroy(&pcbddc->benign_sf);CHKERRQ(ierr); 24069f47a83aSStefano Zampini ierr = MatDestroy(&pcbddc->benign_B0);CHKERRQ(ierr); 2407a3df083aSStefano Zampini for (n=0;n<pcbddc->benign_n;n++) { 2408a3df083aSStefano Zampini ierr = ISDestroy(&pcbddc->benign_zerodiag_subs[n]);CHKERRQ(ierr); 2409a3df083aSStefano Zampini } 2410a3df083aSStefano Zampini ierr = PetscFree(pcbddc->benign_zerodiag_subs);CHKERRQ(ierr); 2411a3df083aSStefano Zampini pcbddc->benign_n = 0; 241228b8efb1Sstefano_zampini 241328b8efb1Sstefano_zampini /* if a local info on dofs is present, uses the last field for "pressures" (or fid by command line) 24144f1b2e48SStefano Zampini otherwise, it uses only zerodiagonal dofs (ok if the pressure block is all zero; it could fail if it is not) 24154f1b2e48SStefano Zampini Checks if all the pressure dofs in each subdomain have a zero diagonal 24164f1b2e48SStefano Zampini If not, a change of basis on pressures is not needed 24171ae86dd6SStefano Zampini since the local Schur complements 
are already SPD 24184f1b2e48SStefano Zampini */ 24194f1b2e48SStefano Zampini has_null_pressures = PETSC_TRUE; 24204f1b2e48SStefano Zampini have_null = PETSC_TRUE; 242140fa8d13SStefano Zampini if (pcbddc->n_ISForDofsLocal) { 24227fbe2174Sstefano_zampini IS iP = NULL; 24234f1b2e48SStefano Zampini PetscInt npl,*idxs,p = pcbddc->n_ISForDofsLocal-1; 24244f1b2e48SStefano Zampini 242528b8efb1Sstefano_zampini ierr = PetscOptionsBegin(PetscObjectComm((PetscObject)pc),((PetscObject)pc)->prefix,"BDDC benign options","PC");CHKERRQ(ierr); 242628b8efb1Sstefano_zampini ierr = PetscOptionsInt("-pc_bddc_pressure_field","Field id for pressures",NULL,p,&p,NULL);CHKERRQ(ierr); 242728b8efb1Sstefano_zampini ierr = PetscOptionsEnd();CHKERRQ(ierr); 242828b8efb1Sstefano_zampini if (p < 0 || p > pcbddc->n_ISForDofsLocal-1) SETERRQ1(PetscObjectComm((PetscObject)pc),PETSC_ERR_USER,"Invalid field id for pressures %D",p); 24294f1b2e48SStefano Zampini /* Dofs splitting for BDDC cannot have PETSC_COMM_SELF, so create a sequential IS */ 24304f1b2e48SStefano Zampini ierr = ISGetLocalSize(pcbddc->ISForDofsLocal[p],&npl);CHKERRQ(ierr); 24314f1b2e48SStefano Zampini ierr = ISGetIndices(pcbddc->ISForDofsLocal[p],(const PetscInt**)&idxs);CHKERRQ(ierr); 24324f1b2e48SStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,npl,idxs,PETSC_COPY_VALUES,&pressures);CHKERRQ(ierr); 2433ba14f8e3SStefano Zampini ierr = ISRestoreIndices(pcbddc->ISForDofsLocal[p],(const PetscInt**)&idxs);CHKERRQ(ierr); 24347fbe2174Sstefano_zampini /* remove zeroed out pressures if we are setting up a BDDC solver for a saddle-point FETI-DP */ 24357fbe2174Sstefano_zampini ierr = PetscObjectQuery((PetscObject)pc,"__KSPFETIDP_lP",(PetscObject*)&iP);CHKERRQ(ierr); 24367fbe2174Sstefano_zampini if (iP) { 24377fbe2174Sstefano_zampini IS newpressures; 24387fbe2174Sstefano_zampini 24397fbe2174Sstefano_zampini ierr = ISDifference(pressures,iP,&newpressures);CHKERRQ(ierr); 24407fbe2174Sstefano_zampini ierr = ISDestroy(&pressures);CHKERRQ(ierr); 
24417fbe2174Sstefano_zampini pressures = newpressures; 24427fbe2174Sstefano_zampini } 244340fa8d13SStefano Zampini ierr = ISSorted(pressures,&sorted);CHKERRQ(ierr); 244440fa8d13SStefano Zampini if (!sorted) { 244540fa8d13SStefano Zampini ierr = ISSort(pressures);CHKERRQ(ierr); 244640fa8d13SStefano Zampini } 244740fa8d13SStefano Zampini } else { 244840fa8d13SStefano Zampini pressures = NULL; 244940fa8d13SStefano Zampini } 245097d764eeSStefano Zampini /* pcis has not been setup yet, so get the local size from the subdomain matrix */ 245197d764eeSStefano Zampini ierr = MatGetLocalSize(pcbddc->local_mat,&n,NULL);CHKERRQ(ierr); 245227b6a85dSStefano Zampini if (!n) pcbddc->benign_change_explicit = PETSC_TRUE; 245397d764eeSStefano Zampini ierr = MatFindZeroDiagonals(pcbddc->local_mat,&zerodiag);CHKERRQ(ierr); 2454339f8db1SStefano Zampini ierr = ISSorted(zerodiag,&sorted);CHKERRQ(ierr); 2455339f8db1SStefano Zampini if (!sorted) { 2456339f8db1SStefano Zampini ierr = ISSort(zerodiag);CHKERRQ(ierr); 2457339f8db1SStefano Zampini } 24584edc6404Sstefano_zampini ierr = PetscObjectReference((PetscObject)zerodiag);CHKERRQ(ierr); 24594edc6404Sstefano_zampini zerodiag_save = zerodiag; 2460339f8db1SStefano Zampini ierr = ISGetLocalSize(zerodiag,&nz);CHKERRQ(ierr); 24614f1b2e48SStefano Zampini if (!nz) { 24624f1b2e48SStefano Zampini if (n) have_null = PETSC_FALSE; 24634f1b2e48SStefano Zampini has_null_pressures = PETSC_FALSE; 246440fa8d13SStefano Zampini ierr = ISDestroy(&zerodiag);CHKERRQ(ierr); 246540fa8d13SStefano Zampini } 24664f1b2e48SStefano Zampini recompute_zerodiag = PETSC_FALSE; 24674f1b2e48SStefano Zampini /* in case disconnected subdomains info is present, split the pressures accordingly (otherwise the benign trick could fail) */ 24684f1b2e48SStefano Zampini zerodiag_subs = NULL; 24694f1b2e48SStefano Zampini pcbddc->benign_n = 0; 24701f4df5f7SStefano Zampini n_interior_dofs = 0; 24711f4df5f7SStefano Zampini interior_dofs = NULL; 24724edc6404Sstefano_zampini nneu = 0; 
24734edc6404Sstefano_zampini if (pcbddc->NeumannBoundariesLocal) { 24744edc6404Sstefano_zampini ierr = ISGetLocalSize(pcbddc->NeumannBoundariesLocal,&nneu);CHKERRQ(ierr); 24754edc6404Sstefano_zampini } 24763369cb78Sstefano_zampini checkb = (PetscBool)(!pcbddc->NeumannBoundariesLocal || pcbddc->current_level); 24774edc6404Sstefano_zampini if (checkb) { /* need to compute interior nodes */ 24781f4df5f7SStefano Zampini PetscInt n,i,j; 24791f4df5f7SStefano Zampini PetscInt n_neigh,*neigh,*n_shared,**shared; 24801f4df5f7SStefano Zampini PetscInt *iwork; 24811f4df5f7SStefano Zampini 24821f4df5f7SStefano Zampini ierr = ISLocalToGlobalMappingGetSize(pc->pmat->rmap->mapping,&n);CHKERRQ(ierr); 24831f4df5f7SStefano Zampini ierr = ISLocalToGlobalMappingGetInfo(pc->pmat->rmap->mapping,&n_neigh,&neigh,&n_shared,&shared);CHKERRQ(ierr); 24841f4df5f7SStefano Zampini ierr = PetscCalloc1(n,&iwork);CHKERRQ(ierr); 24851f4df5f7SStefano Zampini ierr = PetscMalloc1(n,&interior_dofs);CHKERRQ(ierr); 248690648384SStefano Zampini for (i=1;i<n_neigh;i++) 24871f4df5f7SStefano Zampini for (j=0;j<n_shared[i];j++) 24881f4df5f7SStefano Zampini iwork[shared[i][j]] += 1; 24891f4df5f7SStefano Zampini for (i=0;i<n;i++) 24901f4df5f7SStefano Zampini if (!iwork[i]) 24911f4df5f7SStefano Zampini interior_dofs[n_interior_dofs++] = i; 24921f4df5f7SStefano Zampini ierr = PetscFree(iwork);CHKERRQ(ierr); 24931f4df5f7SStefano Zampini ierr = ISLocalToGlobalMappingRestoreInfo(pc->pmat->rmap->mapping,&n_neigh,&neigh,&n_shared,&shared);CHKERRQ(ierr); 24941f4df5f7SStefano Zampini } 24954f1b2e48SStefano Zampini if (has_null_pressures) { 24964f1b2e48SStefano Zampini IS *subs; 24974edc6404Sstefano_zampini PetscInt nsubs,i,j,nl; 24981f4df5f7SStefano Zampini const PetscInt *idxs; 24991f4df5f7SStefano Zampini PetscScalar *array; 25001f4df5f7SStefano Zampini Vec *work; 25011f4df5f7SStefano Zampini Mat_IS* matis = (Mat_IS*)(pc->pmat->data); 25024f1b2e48SStefano Zampini 25034f1b2e48SStefano Zampini subs = pcbddc->local_subs; 
25044f1b2e48SStefano Zampini nsubs = pcbddc->n_local_subs; 25051f4df5f7SStefano Zampini /* these vectors are needed to check if the constant on pressures is in the kernel of the local operator B (i.e. B(v_I,p0) should be zero) */ 25064edc6404Sstefano_zampini if (checkb) { 25071f4df5f7SStefano Zampini ierr = VecDuplicateVecs(matis->y,2,&work);CHKERRQ(ierr); 25081f4df5f7SStefano Zampini ierr = ISGetLocalSize(zerodiag,&nl);CHKERRQ(ierr); 25091f4df5f7SStefano Zampini ierr = ISGetIndices(zerodiag,&idxs);CHKERRQ(ierr); 25101f4df5f7SStefano Zampini /* work[0] = 1_p */ 25111f4df5f7SStefano Zampini ierr = VecSet(work[0],0.);CHKERRQ(ierr); 25121f4df5f7SStefano Zampini ierr = VecGetArray(work[0],&array);CHKERRQ(ierr); 25131f4df5f7SStefano Zampini for (j=0;j<nl;j++) array[idxs[j]] = 1.; 25141f4df5f7SStefano Zampini ierr = VecRestoreArray(work[0],&array);CHKERRQ(ierr); 25151f4df5f7SStefano Zampini /* work[0] = 1_v */ 25161f4df5f7SStefano Zampini ierr = VecSet(work[1],1.);CHKERRQ(ierr); 25171f4df5f7SStefano Zampini ierr = VecGetArray(work[1],&array);CHKERRQ(ierr); 25181f4df5f7SStefano Zampini for (j=0;j<nl;j++) array[idxs[j]] = 0.; 25191f4df5f7SStefano Zampini ierr = VecRestoreArray(work[1],&array);CHKERRQ(ierr); 25201f4df5f7SStefano Zampini ierr = ISRestoreIndices(zerodiag,&idxs);CHKERRQ(ierr); 25211f4df5f7SStefano Zampini } 25224f1b2e48SStefano Zampini if (nsubs > 1) { 25234f1b2e48SStefano Zampini ierr = PetscCalloc1(nsubs,&zerodiag_subs);CHKERRQ(ierr); 25244f1b2e48SStefano Zampini for (i=0;i<nsubs;i++) { 25254f1b2e48SStefano Zampini ISLocalToGlobalMapping l2g; 25264f1b2e48SStefano Zampini IS t_zerodiag_subs; 25274f1b2e48SStefano Zampini PetscInt nl; 25284f1b2e48SStefano Zampini 25294f1b2e48SStefano Zampini ierr = ISLocalToGlobalMappingCreateIS(subs[i],&l2g);CHKERRQ(ierr); 25304f1b2e48SStefano Zampini ierr = ISGlobalToLocalMappingApplyIS(l2g,IS_GTOLM_DROP,zerodiag,&t_zerodiag_subs);CHKERRQ(ierr); 25314f1b2e48SStefano Zampini ierr = 
ISGetLocalSize(t_zerodiag_subs,&nl);CHKERRQ(ierr); 25324f1b2e48SStefano Zampini if (nl) { 25334f1b2e48SStefano Zampini PetscBool valid = PETSC_TRUE; 25344f1b2e48SStefano Zampini 25354edc6404Sstefano_zampini if (checkb) { 25361f4df5f7SStefano Zampini ierr = VecSet(matis->x,0);CHKERRQ(ierr); 25371f4df5f7SStefano Zampini ierr = ISGetLocalSize(subs[i],&nl);CHKERRQ(ierr); 25381f4df5f7SStefano Zampini ierr = ISGetIndices(subs[i],&idxs);CHKERRQ(ierr); 25391f4df5f7SStefano Zampini ierr = VecGetArray(matis->x,&array);CHKERRQ(ierr); 25401f4df5f7SStefano Zampini for (j=0;j<nl;j++) array[idxs[j]] = 1.; 25411f4df5f7SStefano Zampini ierr = VecRestoreArray(matis->x,&array);CHKERRQ(ierr); 25421f4df5f7SStefano Zampini ierr = ISRestoreIndices(subs[i],&idxs);CHKERRQ(ierr); 25431f4df5f7SStefano Zampini ierr = VecPointwiseMult(matis->x,work[0],matis->x);CHKERRQ(ierr); 25441f4df5f7SStefano Zampini ierr = MatMult(matis->A,matis->x,matis->y);CHKERRQ(ierr); 25451f4df5f7SStefano Zampini ierr = VecPointwiseMult(matis->y,work[1],matis->y);CHKERRQ(ierr); 25461f4df5f7SStefano Zampini ierr = VecGetArray(matis->y,&array);CHKERRQ(ierr); 25471f4df5f7SStefano Zampini for (j=0;j<n_interior_dofs;j++) { 25481f4df5f7SStefano Zampini if (PetscAbsScalar(array[interior_dofs[j]]) > PETSC_SMALL) { 25491f4df5f7SStefano Zampini valid = PETSC_FALSE; 25501f4df5f7SStefano Zampini break; 25511f4df5f7SStefano Zampini } 25521f4df5f7SStefano Zampini } 25531f4df5f7SStefano Zampini ierr = VecRestoreArray(matis->y,&array);CHKERRQ(ierr); 25541f4df5f7SStefano Zampini } 25556632bad2Sstefano_zampini if (valid && nneu) { 25566632bad2Sstefano_zampini const PetscInt *idxs; 25571f4df5f7SStefano Zampini PetscInt nzb; 25581f4df5f7SStefano Zampini 25596632bad2Sstefano_zampini ierr = ISGetIndices(pcbddc->NeumannBoundariesLocal,&idxs);CHKERRQ(ierr); 25606632bad2Sstefano_zampini ierr = ISGlobalToLocalMappingApply(l2g,IS_GTOLM_DROP,nneu,idxs,&nzb,NULL);CHKERRQ(ierr); 25616632bad2Sstefano_zampini ierr = 
ISRestoreIndices(pcbddc->NeumannBoundariesLocal,&idxs);CHKERRQ(ierr); 25621f4df5f7SStefano Zampini if (nzb) valid = PETSC_FALSE; 25631f4df5f7SStefano Zampini } 25641f4df5f7SStefano Zampini if (valid && pressures) { 25654f1b2e48SStefano Zampini IS t_pressure_subs; 25664f1b2e48SStefano Zampini ierr = ISGlobalToLocalMappingApplyIS(l2g,IS_GTOLM_DROP,pressures,&t_pressure_subs);CHKERRQ(ierr); 25674f1b2e48SStefano Zampini ierr = ISEqual(t_pressure_subs,t_zerodiag_subs,&valid);CHKERRQ(ierr); 25684f1b2e48SStefano Zampini ierr = ISDestroy(&t_pressure_subs);CHKERRQ(ierr); 25694f1b2e48SStefano Zampini } 25704f1b2e48SStefano Zampini if (valid) { 25714f1b2e48SStefano Zampini ierr = ISLocalToGlobalMappingApplyIS(l2g,t_zerodiag_subs,&zerodiag_subs[pcbddc->benign_n]);CHKERRQ(ierr); 25724f1b2e48SStefano Zampini pcbddc->benign_n++; 25734f1b2e48SStefano Zampini } else { 25744f1b2e48SStefano Zampini recompute_zerodiag = PETSC_TRUE; 25754f1b2e48SStefano Zampini } 25764f1b2e48SStefano Zampini } 25774f1b2e48SStefano Zampini ierr = ISDestroy(&t_zerodiag_subs);CHKERRQ(ierr); 25784f1b2e48SStefano Zampini ierr = ISLocalToGlobalMappingDestroy(&l2g);CHKERRQ(ierr); 25794f1b2e48SStefano Zampini } 25804f1b2e48SStefano Zampini } else { /* there's just one subdomain (or zero if they have not been detected */ 25814f1b2e48SStefano Zampini PetscBool valid = PETSC_TRUE; 25821f4df5f7SStefano Zampini 25836632bad2Sstefano_zampini if (nneu) valid = PETSC_FALSE; 25841f4df5f7SStefano Zampini if (valid && pressures) { 25854f1b2e48SStefano Zampini ierr = ISEqual(pressures,zerodiag,&valid);CHKERRQ(ierr); 25864f1b2e48SStefano Zampini } 25874edc6404Sstefano_zampini if (valid && checkb) { 25881f4df5f7SStefano Zampini ierr = MatMult(matis->A,work[0],matis->x);CHKERRQ(ierr); 25891f4df5f7SStefano Zampini ierr = VecPointwiseMult(matis->x,work[1],matis->x);CHKERRQ(ierr); 25901f4df5f7SStefano Zampini ierr = VecGetArray(matis->x,&array);CHKERRQ(ierr); 25911f4df5f7SStefano Zampini for (j=0;j<n_interior_dofs;j++) { 
25921f4df5f7SStefano Zampini if (PetscAbsScalar(array[interior_dofs[j]]) > PETSC_SMALL) { 25931f4df5f7SStefano Zampini valid = PETSC_FALSE; 25941f4df5f7SStefano Zampini break; 25951f4df5f7SStefano Zampini } 25961f4df5f7SStefano Zampini } 25971f4df5f7SStefano Zampini ierr = VecRestoreArray(matis->x,&array);CHKERRQ(ierr); 25981f4df5f7SStefano Zampini } 25994f1b2e48SStefano Zampini if (valid) { 26004f1b2e48SStefano Zampini pcbddc->benign_n = 1; 2601ca92afb2SStefano Zampini ierr = PetscMalloc1(pcbddc->benign_n,&zerodiag_subs);CHKERRQ(ierr); 26024f1b2e48SStefano Zampini ierr = PetscObjectReference((PetscObject)zerodiag);CHKERRQ(ierr); 26034f1b2e48SStefano Zampini zerodiag_subs[0] = zerodiag; 26044f1b2e48SStefano Zampini } 26054f1b2e48SStefano Zampini } 26064edc6404Sstefano_zampini if (checkb) { 26071f4df5f7SStefano Zampini ierr = VecDestroyVecs(2,&work);CHKERRQ(ierr); 26084f1b2e48SStefano Zampini } 26091f4df5f7SStefano Zampini } 26101f4df5f7SStefano Zampini ierr = PetscFree(interior_dofs);CHKERRQ(ierr); 26114f1b2e48SStefano Zampini 26124f1b2e48SStefano Zampini if (!pcbddc->benign_n) { 2613b9b0e38cSStefano Zampini PetscInt n; 2614b9b0e38cSStefano Zampini 26154f1b2e48SStefano Zampini ierr = ISDestroy(&zerodiag);CHKERRQ(ierr); 26164f1b2e48SStefano Zampini recompute_zerodiag = PETSC_FALSE; 2617b9b0e38cSStefano Zampini ierr = MatGetLocalSize(pcbddc->local_mat,&n,NULL);CHKERRQ(ierr); 2618b9b0e38cSStefano Zampini if (n) { 26194f1b2e48SStefano Zampini has_null_pressures = PETSC_FALSE; 26204f1b2e48SStefano Zampini have_null = PETSC_FALSE; 26214f1b2e48SStefano Zampini } 2622b9b0e38cSStefano Zampini } 26234f1b2e48SStefano Zampini 26244f1b2e48SStefano Zampini /* final check for null pressures */ 26254f1b2e48SStefano Zampini if (zerodiag && pressures) { 26264f1b2e48SStefano Zampini PetscInt nz,np; 26274f1b2e48SStefano Zampini ierr = ISGetLocalSize(zerodiag,&nz);CHKERRQ(ierr); 26284f1b2e48SStefano Zampini ierr = ISGetLocalSize(pressures,&np);CHKERRQ(ierr); 26294f1b2e48SStefano 
Zampini if (nz != np) have_null = PETSC_FALSE; 26304f1b2e48SStefano Zampini } 26314f1b2e48SStefano Zampini 26324f1b2e48SStefano Zampini if (recompute_zerodiag) { 26334f1b2e48SStefano Zampini ierr = ISDestroy(&zerodiag);CHKERRQ(ierr); 26344f1b2e48SStefano Zampini if (pcbddc->benign_n == 1) { 26354f1b2e48SStefano Zampini ierr = PetscObjectReference((PetscObject)zerodiag_subs[0]);CHKERRQ(ierr); 26364f1b2e48SStefano Zampini zerodiag = zerodiag_subs[0]; 26374f1b2e48SStefano Zampini } else { 26384f1b2e48SStefano Zampini PetscInt i,nzn,*new_idxs; 26394f1b2e48SStefano Zampini 26404f1b2e48SStefano Zampini nzn = 0; 26414f1b2e48SStefano Zampini for (i=0;i<pcbddc->benign_n;i++) { 26424f1b2e48SStefano Zampini PetscInt ns; 26434f1b2e48SStefano Zampini ierr = ISGetLocalSize(zerodiag_subs[i],&ns);CHKERRQ(ierr); 26444f1b2e48SStefano Zampini nzn += ns; 26454f1b2e48SStefano Zampini } 26464f1b2e48SStefano Zampini ierr = PetscMalloc1(nzn,&new_idxs);CHKERRQ(ierr); 26474f1b2e48SStefano Zampini nzn = 0; 26484f1b2e48SStefano Zampini for (i=0;i<pcbddc->benign_n;i++) { 26494f1b2e48SStefano Zampini PetscInt ns,*idxs; 26504f1b2e48SStefano Zampini ierr = ISGetLocalSize(zerodiag_subs[i],&ns);CHKERRQ(ierr); 26514f1b2e48SStefano Zampini ierr = ISGetIndices(zerodiag_subs[i],(const PetscInt**)&idxs);CHKERRQ(ierr); 26524f1b2e48SStefano Zampini ierr = PetscMemcpy(new_idxs+nzn,idxs,ns*sizeof(PetscInt));CHKERRQ(ierr); 26534f1b2e48SStefano Zampini ierr = ISRestoreIndices(zerodiag_subs[i],(const PetscInt**)&idxs);CHKERRQ(ierr); 26544f1b2e48SStefano Zampini nzn += ns; 26554f1b2e48SStefano Zampini } 26564f1b2e48SStefano Zampini ierr = PetscSortInt(nzn,new_idxs);CHKERRQ(ierr); 26574f1b2e48SStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,nzn,new_idxs,PETSC_OWN_POINTER,&zerodiag);CHKERRQ(ierr); 26584f1b2e48SStefano Zampini } 26594f1b2e48SStefano Zampini have_null = PETSC_FALSE; 26604f1b2e48SStefano Zampini } 26614f1b2e48SStefano Zampini 2662669cc0f4SStefano Zampini /* Prepare matrix to compute 
no-net-flux */ 2663a198735bSStefano Zampini if (pcbddc->compute_nonetflux && !pcbddc->divudotp) { 2664a198735bSStefano Zampini Mat A,loc_divudotp; 2665a198735bSStefano Zampini ISLocalToGlobalMapping rl2g,cl2g,l2gmap; 2666a198735bSStefano Zampini IS row,col,isused = NULL; 2667a198735bSStefano Zampini PetscInt M,N,n,st,n_isused; 2668a198735bSStefano Zampini 26691f4df5f7SStefano Zampini if (pressures) { 26701f4df5f7SStefano Zampini isused = pressures; 26711f4df5f7SStefano Zampini } else { 26724edc6404Sstefano_zampini isused = zerodiag_save; 26731f4df5f7SStefano Zampini } 2674a198735bSStefano Zampini ierr = MatGetLocalToGlobalMapping(pc->pmat,&l2gmap,NULL);CHKERRQ(ierr); 2675669cc0f4SStefano Zampini ierr = MatISGetLocalMat(pc->pmat,&A);CHKERRQ(ierr); 26761ae86dd6SStefano Zampini ierr = MatGetLocalSize(A,&n,NULL);CHKERRQ(ierr); 26771ae86dd6SStefano Zampini if (!isused && n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_USER,"Don't know how to extract div u dot p! Please provide the pressure field"); 2678a198735bSStefano Zampini n_isused = 0; 2679a198735bSStefano Zampini if (isused) { 2680a198735bSStefano Zampini ierr = ISGetLocalSize(isused,&n_isused);CHKERRQ(ierr); 2681a198735bSStefano Zampini } 2682a198735bSStefano Zampini ierr = MPI_Scan(&n_isused,&st,1,MPIU_INT,MPI_SUM,PetscObjectComm((PetscObject)pc));CHKERRQ(ierr); 2683a198735bSStefano Zampini st = st-n_isused; 26841ae86dd6SStefano Zampini if (n) { 2685a198735bSStefano Zampini const PetscInt *gidxs; 2686a198735bSStefano Zampini 26877dae84e0SHong Zhang ierr = MatCreateSubMatrix(A,isused,NULL,MAT_INITIAL_MATRIX,&loc_divudotp);CHKERRQ(ierr); 2688a198735bSStefano Zampini ierr = ISLocalToGlobalMappingGetIndices(l2gmap,&gidxs);CHKERRQ(ierr); 2689a198735bSStefano Zampini /* TODO: extend ISCreateStride with st = PETSC_DECIDE */ 2690a198735bSStefano Zampini ierr = ISCreateStride(PetscObjectComm((PetscObject)pc),n_isused,st,1,&row);CHKERRQ(ierr); 2691a198735bSStefano Zampini ierr = 
ISCreateGeneral(PetscObjectComm((PetscObject)pc),n,gidxs,PETSC_COPY_VALUES,&col);CHKERRQ(ierr); 2692a198735bSStefano Zampini ierr = ISLocalToGlobalMappingRestoreIndices(l2gmap,&gidxs);CHKERRQ(ierr); 26931ae86dd6SStefano Zampini } else { 2694a198735bSStefano Zampini ierr = MatCreateSeqAIJ(PETSC_COMM_SELF,0,0,1,NULL,&loc_divudotp);CHKERRQ(ierr); 2695a198735bSStefano Zampini ierr = ISCreateStride(PetscObjectComm((PetscObject)pc),n_isused,st,1,&row);CHKERRQ(ierr); 2696a198735bSStefano Zampini ierr = ISCreateGeneral(PetscObjectComm((PetscObject)pc),0,NULL,PETSC_COPY_VALUES,&col);CHKERRQ(ierr); 2697a198735bSStefano Zampini } 2698a198735bSStefano Zampini ierr = MatGetSize(pc->pmat,NULL,&N);CHKERRQ(ierr); 2699a198735bSStefano Zampini ierr = ISGetSize(row,&M);CHKERRQ(ierr); 2700a198735bSStefano Zampini ierr = ISLocalToGlobalMappingCreateIS(row,&rl2g);CHKERRQ(ierr); 2701a198735bSStefano Zampini ierr = ISLocalToGlobalMappingCreateIS(col,&cl2g);CHKERRQ(ierr); 2702a198735bSStefano Zampini ierr = ISDestroy(&row);CHKERRQ(ierr); 2703a198735bSStefano Zampini ierr = ISDestroy(&col);CHKERRQ(ierr); 2704a198735bSStefano Zampini ierr = MatCreate(PetscObjectComm((PetscObject)pc),&pcbddc->divudotp);CHKERRQ(ierr); 2705a198735bSStefano Zampini ierr = MatSetType(pcbddc->divudotp,MATIS);CHKERRQ(ierr); 2706a198735bSStefano Zampini ierr = MatSetSizes(pcbddc->divudotp,PETSC_DECIDE,PETSC_DECIDE,M,N);CHKERRQ(ierr); 2707a198735bSStefano Zampini ierr = MatSetLocalToGlobalMapping(pcbddc->divudotp,rl2g,cl2g);CHKERRQ(ierr); 2708a198735bSStefano Zampini ierr = ISLocalToGlobalMappingDestroy(&rl2g);CHKERRQ(ierr); 2709a198735bSStefano Zampini ierr = ISLocalToGlobalMappingDestroy(&cl2g);CHKERRQ(ierr); 2710a198735bSStefano Zampini ierr = MatISSetLocalMat(pcbddc->divudotp,loc_divudotp);CHKERRQ(ierr); 2711a198735bSStefano Zampini ierr = MatDestroy(&loc_divudotp);CHKERRQ(ierr); 27121ae86dd6SStefano Zampini ierr = MatAssemblyBegin(pcbddc->divudotp,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 27131ae86dd6SStefano Zampini 
ierr = MatAssemblyEnd(pcbddc->divudotp,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 27141ae86dd6SStefano Zampini } 27154edc6404Sstefano_zampini ierr = ISDestroy(&zerodiag_save);CHKERRQ(ierr); 2716b3afcdbeSStefano Zampini 2717b3afcdbeSStefano Zampini /* change of basis and p0 dofs */ 27184f1b2e48SStefano Zampini if (has_null_pressures) { 27194f1b2e48SStefano Zampini IS zerodiagc; 27204f1b2e48SStefano Zampini const PetscInt *idxs,*idxsc; 27214f1b2e48SStefano Zampini PetscInt i,s,*nnz; 27224f1b2e48SStefano Zampini 27234f1b2e48SStefano Zampini ierr = ISGetLocalSize(zerodiag,&nz);CHKERRQ(ierr); 2724339f8db1SStefano Zampini ierr = ISComplement(zerodiag,0,n,&zerodiagc);CHKERRQ(ierr); 2725339f8db1SStefano Zampini ierr = ISGetIndices(zerodiagc,&idxsc);CHKERRQ(ierr); 2726339f8db1SStefano Zampini /* local change of basis for pressures */ 2727339f8db1SStefano Zampini ierr = MatDestroy(&pcbddc->benign_change);CHKERRQ(ierr); 272897d764eeSStefano Zampini ierr = MatCreate(PetscObjectComm((PetscObject)pcbddc->local_mat),&pcbddc->benign_change);CHKERRQ(ierr); 2729339f8db1SStefano Zampini ierr = MatSetType(pcbddc->benign_change,MATAIJ);CHKERRQ(ierr); 2730339f8db1SStefano Zampini ierr = MatSetSizes(pcbddc->benign_change,n,n,PETSC_DECIDE,PETSC_DECIDE);CHKERRQ(ierr); 2731339f8db1SStefano Zampini ierr = PetscMalloc1(n,&nnz);CHKERRQ(ierr); 27324f1b2e48SStefano Zampini for (i=0;i<n-nz;i++) nnz[idxsc[i]] = 1; /* identity on velocities plus pressure dofs for non-singular subdomains */ 27334f1b2e48SStefano Zampini for (i=0;i<pcbddc->benign_n;i++) { 27344f1b2e48SStefano Zampini PetscInt nzs,j; 27354f1b2e48SStefano Zampini 27364f1b2e48SStefano Zampini ierr = ISGetLocalSize(zerodiag_subs[i],&nzs);CHKERRQ(ierr); 27374f1b2e48SStefano Zampini ierr = ISGetIndices(zerodiag_subs[i],&idxs);CHKERRQ(ierr); 27384f1b2e48SStefano Zampini for (j=0;j<nzs-1;j++) nnz[idxs[j]] = 2; /* change on pressures */ 27394f1b2e48SStefano Zampini nnz[idxs[nzs-1]] = nzs; /* last local pressure dof in subdomain */ 27404f1b2e48SStefano 
Zampini ierr = ISRestoreIndices(zerodiag_subs[i],&idxs);CHKERRQ(ierr); 27414f1b2e48SStefano Zampini } 2742339f8db1SStefano Zampini ierr = MatSeqAIJSetPreallocation(pcbddc->benign_change,0,nnz);CHKERRQ(ierr); 2743339f8db1SStefano Zampini ierr = PetscFree(nnz);CHKERRQ(ierr); 2744339f8db1SStefano Zampini /* set identity on velocities */ 2745339f8db1SStefano Zampini for (i=0;i<n-nz;i++) { 2746339f8db1SStefano Zampini ierr = MatSetValue(pcbddc->benign_change,idxsc[i],idxsc[i],1.,INSERT_VALUES);CHKERRQ(ierr); 2747339f8db1SStefano Zampini } 27484f1b2e48SStefano Zampini ierr = ISRestoreIndices(zerodiagc,&idxsc);CHKERRQ(ierr); 27494f1b2e48SStefano Zampini ierr = ISDestroy(&zerodiagc);CHKERRQ(ierr); 27509f47a83aSStefano Zampini ierr = PetscFree3(pcbddc->benign_p0_lidx,pcbddc->benign_p0_gidx,pcbddc->benign_p0);CHKERRQ(ierr); 27514f1b2e48SStefano Zampini ierr = PetscMalloc3(pcbddc->benign_n,&pcbddc->benign_p0_lidx,pcbddc->benign_n,&pcbddc->benign_p0_gidx,pcbddc->benign_n,&pcbddc->benign_p0);CHKERRQ(ierr); 2752339f8db1SStefano Zampini /* set change on pressures */ 27534f1b2e48SStefano Zampini for (s=0;s<pcbddc->benign_n;s++) { 27544f1b2e48SStefano Zampini PetscScalar *array; 27554f1b2e48SStefano Zampini PetscInt nzs; 27564f1b2e48SStefano Zampini 27574f1b2e48SStefano Zampini ierr = ISGetLocalSize(zerodiag_subs[s],&nzs);CHKERRQ(ierr); 27584f1b2e48SStefano Zampini ierr = ISGetIndices(zerodiag_subs[s],&idxs);CHKERRQ(ierr); 27594f1b2e48SStefano Zampini for (i=0;i<nzs-1;i++) { 2760339f8db1SStefano Zampini PetscScalar vals[2]; 2761339f8db1SStefano Zampini PetscInt cols[2]; 2762339f8db1SStefano Zampini 2763339f8db1SStefano Zampini cols[0] = idxs[i]; 27644f1b2e48SStefano Zampini cols[1] = idxs[nzs-1]; 2765339f8db1SStefano Zampini vals[0] = 1.; 2766b0f5fe93SStefano Zampini vals[1] = 1.; 27674f1b2e48SStefano Zampini ierr = MatSetValues(pcbddc->benign_change,1,cols,2,cols,vals,INSERT_VALUES);CHKERRQ(ierr); 2768339f8db1SStefano Zampini } 27694f1b2e48SStefano Zampini ierr = 
PetscMalloc1(nzs,&array);CHKERRQ(ierr); 27704f1b2e48SStefano Zampini for (i=0;i<nzs-1;i++) array[i] = -1.; 27714f1b2e48SStefano Zampini array[nzs-1] = 1.; 27724f1b2e48SStefano Zampini ierr = MatSetValues(pcbddc->benign_change,1,idxs+nzs-1,nzs,idxs,array,INSERT_VALUES);CHKERRQ(ierr); 27734f1b2e48SStefano Zampini /* store local idxs for p0 */ 27744f1b2e48SStefano Zampini pcbddc->benign_p0_lidx[s] = idxs[nzs-1]; 27754f1b2e48SStefano Zampini ierr = ISRestoreIndices(zerodiag_subs[s],&idxs);CHKERRQ(ierr); 2776339f8db1SStefano Zampini ierr = PetscFree(array);CHKERRQ(ierr); 27774f1b2e48SStefano Zampini } 2778339f8db1SStefano Zampini ierr = MatAssemblyBegin(pcbddc->benign_change,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2779339f8db1SStefano Zampini ierr = MatAssemblyEnd(pcbddc->benign_change,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2780a3df083aSStefano Zampini /* project if needed */ 2781a3df083aSStefano Zampini if (pcbddc->benign_change_explicit) { 27821dd7afcfSStefano Zampini Mat M; 27831dd7afcfSStefano Zampini 27841dd7afcfSStefano Zampini ierr = MatPtAP(pcbddc->local_mat,pcbddc->benign_change,MAT_INITIAL_MATRIX,2.0,&M);CHKERRQ(ierr); 2785339f8db1SStefano Zampini ierr = MatDestroy(&pcbddc->local_mat);CHKERRQ(ierr); 27861dd7afcfSStefano Zampini ierr = MatSeqAIJCompress(M,&pcbddc->local_mat);CHKERRQ(ierr); 27871dd7afcfSStefano Zampini ierr = MatDestroy(&M);CHKERRQ(ierr); 2788a3df083aSStefano Zampini } 27894f1b2e48SStefano Zampini /* store global idxs for p0 */ 27904f1b2e48SStefano Zampini ierr = ISLocalToGlobalMappingApply(pc->pmat->rmap->mapping,pcbddc->benign_n,pcbddc->benign_p0_lidx,pcbddc->benign_p0_gidx);CHKERRQ(ierr); 2791339f8db1SStefano Zampini } 2792ca92afb2SStefano Zampini pcbddc->benign_zerodiag_subs = zerodiag_subs; 27934f1b2e48SStefano Zampini ierr = ISDestroy(&pressures);CHKERRQ(ierr); 2794b0f5fe93SStefano Zampini 2795b0f5fe93SStefano Zampini /* determines if the coarse solver will be singular or not */ 2796b0f5fe93SStefano Zampini ierr = 
MPI_Allreduce(&have_null,&pcbddc->benign_null,1,MPIU_BOOL,MPI_LAND,PetscObjectComm((PetscObject)pc));CHKERRQ(ierr); 279727b6a85dSStefano Zampini /* determines if the problem has subdomains with 0 pressure block */ 279827b6a85dSStefano Zampini ierr = MPI_Allreduce(&have_null,&pcbddc->benign_have_null,1,MPIU_BOOL,MPI_LOR,PetscObjectComm((PetscObject)pc));CHKERRQ(ierr); 2799339f8db1SStefano Zampini *zerodiaglocal = zerodiag; 2800339f8db1SStefano Zampini PetscFunctionReturn(0); 2801339f8db1SStefano Zampini } 2802339f8db1SStefano Zampini 2803015636ebSStefano Zampini PetscErrorCode PCBDDCBenignGetOrSetP0(PC pc, Vec v, PetscBool get) 2804efc2fbd9SStefano Zampini { 2805efc2fbd9SStefano Zampini PC_BDDC* pcbddc = (PC_BDDC*)pc->data; 2806de9d7bd0SStefano Zampini PetscScalar *array; 2807efc2fbd9SStefano Zampini PetscErrorCode ierr; 2808efc2fbd9SStefano Zampini 2809efc2fbd9SStefano Zampini PetscFunctionBegin; 2810efc2fbd9SStefano Zampini if (!pcbddc->benign_sf) { 2811efc2fbd9SStefano Zampini ierr = PetscSFCreate(PetscObjectComm((PetscObject)pc),&pcbddc->benign_sf);CHKERRQ(ierr); 28124f1b2e48SStefano Zampini ierr = PetscSFSetGraphLayout(pcbddc->benign_sf,pc->pmat->rmap,pcbddc->benign_n,NULL,PETSC_OWN_POINTER,pcbddc->benign_p0_gidx);CHKERRQ(ierr); 2813efc2fbd9SStefano Zampini } 2814de9d7bd0SStefano Zampini if (get) { 2815efc2fbd9SStefano Zampini ierr = VecGetArrayRead(v,(const PetscScalar**)&array);CHKERRQ(ierr); 28164f1b2e48SStefano Zampini ierr = PetscSFBcastBegin(pcbddc->benign_sf,MPIU_SCALAR,array,pcbddc->benign_p0);CHKERRQ(ierr); 28174f1b2e48SStefano Zampini ierr = PetscSFBcastEnd(pcbddc->benign_sf,MPIU_SCALAR,array,pcbddc->benign_p0);CHKERRQ(ierr); 2818efc2fbd9SStefano Zampini ierr = VecRestoreArrayRead(v,(const PetscScalar**)&array);CHKERRQ(ierr); 2819de9d7bd0SStefano Zampini } else { 2820de9d7bd0SStefano Zampini ierr = VecGetArray(v,&array);CHKERRQ(ierr); 2821de9d7bd0SStefano Zampini ierr = 
PetscSFReduceBegin(pcbddc->benign_sf,MPIU_SCALAR,pcbddc->benign_p0,array,MPIU_REPLACE);CHKERRQ(ierr); 2822de9d7bd0SStefano Zampini ierr = PetscSFReduceEnd(pcbddc->benign_sf,MPIU_SCALAR,pcbddc->benign_p0,array,MPIU_REPLACE);CHKERRQ(ierr); 2823de9d7bd0SStefano Zampini ierr = VecRestoreArray(v,&array);CHKERRQ(ierr); 2824efc2fbd9SStefano Zampini } 2825efc2fbd9SStefano Zampini PetscFunctionReturn(0); 2826efc2fbd9SStefano Zampini } 2827efc2fbd9SStefano Zampini 2828c263805aSStefano Zampini PetscErrorCode PCBDDCBenignPopOrPushB0(PC pc, PetscBool pop) 2829c263805aSStefano Zampini { 2830c263805aSStefano Zampini PC_BDDC* pcbddc = (PC_BDDC*)pc->data; 2831c263805aSStefano Zampini PetscErrorCode ierr; 2832c263805aSStefano Zampini 2833c263805aSStefano Zampini PetscFunctionBegin; 2834c263805aSStefano Zampini /* TODO: add error checking 2835c263805aSStefano Zampini - avoid nested pop (or push) calls. 2836c263805aSStefano Zampini - cannot push before pop. 28371c604dc7SStefano Zampini - cannot call this if pcbddc->local_mat is NULL 2838c263805aSStefano Zampini */ 28394f1b2e48SStefano Zampini if (!pcbddc->benign_n) { 2840efc2fbd9SStefano Zampini PetscFunctionReturn(0); 2841efc2fbd9SStefano Zampini } 2842c263805aSStefano Zampini if (pop) { 2843a3df083aSStefano Zampini if (pcbddc->benign_change_explicit) { 28444f1b2e48SStefano Zampini IS is_p0; 28454f1b2e48SStefano Zampini MatReuse reuse; 2846c263805aSStefano Zampini 2847c263805aSStefano Zampini /* extract B_0 */ 28484f1b2e48SStefano Zampini reuse = MAT_INITIAL_MATRIX; 28494f1b2e48SStefano Zampini if (pcbddc->benign_B0) { 28504f1b2e48SStefano Zampini reuse = MAT_REUSE_MATRIX; 28514f1b2e48SStefano Zampini } 28524f1b2e48SStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,pcbddc->benign_n,pcbddc->benign_p0_lidx,PETSC_COPY_VALUES,&is_p0);CHKERRQ(ierr); 28537dae84e0SHong Zhang ierr = MatCreateSubMatrix(pcbddc->local_mat,is_p0,NULL,reuse,&pcbddc->benign_B0);CHKERRQ(ierr); 2854c263805aSStefano Zampini /* remove rows and cols from local 
problem */ 2855c263805aSStefano Zampini ierr = MatSetOption(pcbddc->local_mat,MAT_KEEP_NONZERO_PATTERN,PETSC_TRUE);CHKERRQ(ierr); 285697d764eeSStefano Zampini ierr = MatSetOption(pcbddc->local_mat,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_FALSE);CHKERRQ(ierr); 28574f1b2e48SStefano Zampini ierr = MatZeroRowsColumnsIS(pcbddc->local_mat,is_p0,1.0,NULL,NULL);CHKERRQ(ierr); 28584f1b2e48SStefano Zampini ierr = ISDestroy(&is_p0);CHKERRQ(ierr); 2859a3df083aSStefano Zampini } else { 2860a3df083aSStefano Zampini Mat_IS *matis = (Mat_IS*)pc->pmat->data; 2861a3df083aSStefano Zampini PetscScalar *vals; 2862a3df083aSStefano Zampini PetscInt i,n,*idxs_ins; 2863a3df083aSStefano Zampini 2864a3df083aSStefano Zampini ierr = VecGetLocalSize(matis->y,&n);CHKERRQ(ierr); 2865a3df083aSStefano Zampini ierr = PetscMalloc2(n,&idxs_ins,n,&vals);CHKERRQ(ierr); 2866a3df083aSStefano Zampini if (!pcbddc->benign_B0) { 28670b5adadeSStefano Zampini PetscInt *nnz; 2868a3df083aSStefano Zampini ierr = MatCreate(PetscObjectComm((PetscObject)pcbddc->local_mat),&pcbddc->benign_B0);CHKERRQ(ierr); 2869a3df083aSStefano Zampini ierr = MatSetType(pcbddc->benign_B0,MATAIJ);CHKERRQ(ierr); 2870a3df083aSStefano Zampini ierr = MatSetSizes(pcbddc->benign_B0,pcbddc->benign_n,n,PETSC_DECIDE,PETSC_DECIDE);CHKERRQ(ierr); 2871331e053bSStefano Zampini ierr = PetscMalloc1(pcbddc->benign_n,&nnz);CHKERRQ(ierr); 2872331e053bSStefano Zampini for (i=0;i<pcbddc->benign_n;i++) { 2873331e053bSStefano Zampini ierr = ISGetLocalSize(pcbddc->benign_zerodiag_subs[i],&nnz[i]);CHKERRQ(ierr); 2874331e053bSStefano Zampini nnz[i] = n - nnz[i]; 2875331e053bSStefano Zampini } 2876331e053bSStefano Zampini ierr = MatSeqAIJSetPreallocation(pcbddc->benign_B0,0,nnz);CHKERRQ(ierr); 2877331e053bSStefano Zampini ierr = PetscFree(nnz);CHKERRQ(ierr); 2878331e053bSStefano Zampini } 2879a3df083aSStefano Zampini 2880a3df083aSStefano Zampini for (i=0;i<pcbddc->benign_n;i++) { 2881a3df083aSStefano Zampini PetscScalar *array; 2882a3df083aSStefano Zampini PetscInt 
*idxs,j,nz,cum; 2883a3df083aSStefano Zampini 2884a3df083aSStefano Zampini ierr = VecSet(matis->x,0.);CHKERRQ(ierr); 2885a3df083aSStefano Zampini ierr = ISGetLocalSize(pcbddc->benign_zerodiag_subs[i],&nz);CHKERRQ(ierr); 2886a3df083aSStefano Zampini ierr = ISGetIndices(pcbddc->benign_zerodiag_subs[i],(const PetscInt**)&idxs);CHKERRQ(ierr); 2887a3df083aSStefano Zampini for (j=0;j<nz;j++) vals[j] = 1.; 2888a3df083aSStefano Zampini ierr = VecSetValues(matis->x,nz,idxs,vals,INSERT_VALUES);CHKERRQ(ierr); 2889a3df083aSStefano Zampini ierr = VecAssemblyBegin(matis->x);CHKERRQ(ierr); 2890a3df083aSStefano Zampini ierr = VecAssemblyEnd(matis->x);CHKERRQ(ierr); 2891a3df083aSStefano Zampini ierr = VecSet(matis->y,0.);CHKERRQ(ierr); 2892a3df083aSStefano Zampini ierr = MatMult(matis->A,matis->x,matis->y);CHKERRQ(ierr); 2893a3df083aSStefano Zampini ierr = VecGetArray(matis->y,&array);CHKERRQ(ierr); 2894a3df083aSStefano Zampini cum = 0; 2895a3df083aSStefano Zampini for (j=0;j<n;j++) { 289622db5ddcSStefano Zampini if (PetscUnlikely(PetscAbsScalar(array[j]) > PETSC_SMALL)) { 2897a3df083aSStefano Zampini vals[cum] = array[j]; 2898a3df083aSStefano Zampini idxs_ins[cum] = j; 2899a3df083aSStefano Zampini cum++; 2900a3df083aSStefano Zampini } 2901a3df083aSStefano Zampini } 2902a3df083aSStefano Zampini ierr = MatSetValues(pcbddc->benign_B0,1,&i,cum,idxs_ins,vals,INSERT_VALUES);CHKERRQ(ierr); 2903a3df083aSStefano Zampini ierr = VecRestoreArray(matis->y,&array);CHKERRQ(ierr); 2904a3df083aSStefano Zampini ierr = ISRestoreIndices(pcbddc->benign_zerodiag_subs[i],(const PetscInt**)&idxs);CHKERRQ(ierr); 2905a3df083aSStefano Zampini } 2906a3df083aSStefano Zampini ierr = MatAssemblyBegin(pcbddc->benign_B0,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2907a3df083aSStefano Zampini ierr = MatAssemblyEnd(pcbddc->benign_B0,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2908a3df083aSStefano Zampini ierr = PetscFree2(idxs_ins,vals);CHKERRQ(ierr); 2909a3df083aSStefano Zampini } 2910c263805aSStefano Zampini } else { /* push */ 
2911a3df083aSStefano Zampini if (pcbddc->benign_change_explicit) { 29124f1b2e48SStefano Zampini PetscInt i; 29134f1b2e48SStefano Zampini 29144f1b2e48SStefano Zampini for (i=0;i<pcbddc->benign_n;i++) { 29154f1b2e48SStefano Zampini PetscScalar *B0_vals; 29164f1b2e48SStefano Zampini PetscInt *B0_cols,B0_ncol; 29174f1b2e48SStefano Zampini 29184f1b2e48SStefano Zampini ierr = MatGetRow(pcbddc->benign_B0,i,&B0_ncol,(const PetscInt**)&B0_cols,(const PetscScalar**)&B0_vals);CHKERRQ(ierr); 29194f1b2e48SStefano Zampini ierr = MatSetValues(pcbddc->local_mat,1,pcbddc->benign_p0_lidx+i,B0_ncol,B0_cols,B0_vals,INSERT_VALUES);CHKERRQ(ierr); 29207b034428SStefano Zampini ierr = MatSetValues(pcbddc->local_mat,B0_ncol,B0_cols,1,pcbddc->benign_p0_lidx+i,B0_vals,INSERT_VALUES);CHKERRQ(ierr); 29214f1b2e48SStefano Zampini ierr = MatSetValue(pcbddc->local_mat,pcbddc->benign_p0_lidx[i],pcbddc->benign_p0_lidx[i],0.0,INSERT_VALUES);CHKERRQ(ierr); 29224f1b2e48SStefano Zampini ierr = MatRestoreRow(pcbddc->benign_B0,i,&B0_ncol,(const PetscInt**)&B0_cols,(const PetscScalar**)&B0_vals);CHKERRQ(ierr); 29234f1b2e48SStefano Zampini } 2924c263805aSStefano Zampini ierr = MatAssemblyBegin(pcbddc->local_mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2925c263805aSStefano Zampini ierr = MatAssemblyEnd(pcbddc->local_mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2926a3df083aSStefano Zampini } else { 2927a3df083aSStefano Zampini SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Cannot push B0!\n"); 2928a3df083aSStefano Zampini } 2929c263805aSStefano Zampini } 2930c263805aSStefano Zampini PetscFunctionReturn(0); 2931c263805aSStefano Zampini } 2932c263805aSStefano Zampini 293308122e43SStefano Zampini PetscErrorCode PCBDDCAdaptiveSelection(PC pc) 2934b1b3d7a2SStefano Zampini { 2935b1b3d7a2SStefano Zampini PC_BDDC* pcbddc = (PC_BDDC*)pc->data; 293608122e43SStefano Zampini PCBDDCSubSchurs sub_schurs = pcbddc->sub_schurs; 293708122e43SStefano Zampini PetscBLASInt B_dummyint,B_neigs,B_ierr,B_lwork; 293808122e43SStefano Zampini PetscBLASInt 
*B_iwork,*B_ifail; 293908122e43SStefano Zampini PetscScalar *work,lwork; 294008122e43SStefano Zampini PetscScalar *St,*S,*eigv; 294108122e43SStefano Zampini PetscScalar *Sarray,*Starray; 294208122e43SStefano Zampini PetscReal *eigs,thresh; 29431b968477SStefano Zampini PetscInt i,nmax,nmin,nv,cum,mss,cum2,cumarray,maxneigs; 2944f6f667cfSStefano Zampini PetscBool allocated_S_St; 294508122e43SStefano Zampini #if defined(PETSC_USE_COMPLEX) 294608122e43SStefano Zampini PetscReal *rwork; 294708122e43SStefano Zampini #endif 2948b1b3d7a2SStefano Zampini PetscErrorCode ierr; 2949b1b3d7a2SStefano Zampini 2950b1b3d7a2SStefano Zampini PetscFunctionBegin; 2951b334f244SStefano Zampini if (!sub_schurs) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Adaptive selection of constraints requires SubSchurs data"); 2952af25d912SStefano Zampini if (!sub_schurs->schur_explicit) SETERRQ(PetscObjectComm((PetscObject)pc),PETSC_ERR_SUP,"Adaptive selection of constraints requires MUMPS and/or MKL_CPARDISO"); 2953d750e150Sstefano_zampini if (sub_schurs->n_subs && (!sub_schurs->is_hermitian || !sub_schurs->is_posdef)) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_SUP,"Adaptive selection not yet implemented for general matrix pencils (herm %d, posdef %d)\nRerun with -sub_schurs_hermitian 1 -sub_schurs_posdef 1 if the problem is SPD",sub_schurs->is_hermitian,sub_schurs->is_posdef); 295406a4e24aSStefano Zampini 2955fd14bc51SStefano Zampini if (pcbddc->dbg_flag) { 2956fd14bc51SStefano Zampini ierr = PetscViewerFlush(pcbddc->dbg_viewer);CHKERRQ(ierr); 2957fd14bc51SStefano Zampini ierr = PetscViewerASCIIPrintf(pcbddc->dbg_viewer,"--------------------------------------------------\n");CHKERRQ(ierr); 2958fd14bc51SStefano Zampini ierr = PetscViewerASCIIPrintf(pcbddc->dbg_viewer,"Check adaptive selection of constraints\n");CHKERRQ(ierr); 29591575c14dSBarry Smith ierr = PetscViewerASCIIPushSynchronized(pcbddc->dbg_viewer);CHKERRQ(ierr); 2960fd14bc51SStefano Zampini } 2961fd14bc51SStefano Zampini 2962e496cd5dSStefano Zampini 
if (pcbddc->dbg_flag) { 2963e496cd5dSStefano Zampini PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"Subdomain %04d cc %d (%d,%d).\n",PetscGlobalRank,sub_schurs->n_subs,sub_schurs->is_hermitian,sub_schurs->is_posdef); 2964e496cd5dSStefano Zampini } 2965e496cd5dSStefano Zampini 296608122e43SStefano Zampini /* max size of subsets */ 296708122e43SStefano Zampini mss = 0; 296808122e43SStefano Zampini for (i=0;i<sub_schurs->n_subs;i++) { 296908122e43SStefano Zampini PetscInt subset_size; 2970862806e4SStefano Zampini 297108122e43SStefano Zampini ierr = ISGetLocalSize(sub_schurs->is_subs[i],&subset_size);CHKERRQ(ierr); 297208122e43SStefano Zampini mss = PetscMax(mss,subset_size); 297308122e43SStefano Zampini } 297408122e43SStefano Zampini 297508122e43SStefano Zampini /* min/max and threshold */ 297608122e43SStefano Zampini nmax = pcbddc->adaptive_nmax > 0 ? pcbddc->adaptive_nmax : mss; 2977f6f667cfSStefano Zampini nmin = pcbddc->adaptive_nmin > 0 ? pcbddc->adaptive_nmin : 0; 297808122e43SStefano Zampini nmax = PetscMax(nmin,nmax); 2979f6f667cfSStefano Zampini allocated_S_St = PETSC_FALSE; 2980f6f667cfSStefano Zampini if (nmin) { 2981f6f667cfSStefano Zampini allocated_S_St = PETSC_TRUE; 2982f6f667cfSStefano Zampini } 298308122e43SStefano Zampini 298408122e43SStefano Zampini /* allocate lapack workspace */ 298508122e43SStefano Zampini cum = cum2 = 0; 298608122e43SStefano Zampini maxneigs = 0; 298708122e43SStefano Zampini for (i=0;i<sub_schurs->n_subs;i++) { 298808122e43SStefano Zampini PetscInt n,subset_size; 2989f6f667cfSStefano Zampini 299008122e43SStefano Zampini ierr = ISGetLocalSize(sub_schurs->is_subs[i],&subset_size);CHKERRQ(ierr); 299108122e43SStefano Zampini n = PetscMin(subset_size,nmax); 29929162d606SStefano Zampini cum += subset_size; 29939162d606SStefano Zampini cum2 += subset_size*n; 299408122e43SStefano Zampini maxneigs = PetscMax(maxneigs,n); 299508122e43SStefano Zampini } 299608122e43SStefano Zampini if (mss) { 29979ab7bb16SStefano Zampini if 
(sub_schurs->is_hermitian && sub_schurs->is_posdef) { 299808122e43SStefano Zampini PetscBLASInt B_itype = 1; 299908122e43SStefano Zampini PetscBLASInt B_N = mss; 30004c6709b3SStefano Zampini PetscReal zero = 0.0; 30014c6709b3SStefano Zampini PetscReal eps = 0.0; /* dlamch? */ 300208122e43SStefano Zampini 300308122e43SStefano Zampini B_lwork = -1; 300408122e43SStefano Zampini S = NULL; 300508122e43SStefano Zampini St = NULL; 3006a58a30b4SStefano Zampini eigs = NULL; 3007a58a30b4SStefano Zampini eigv = NULL; 3008a58a30b4SStefano Zampini B_iwork = NULL; 3009a58a30b4SStefano Zampini B_ifail = NULL; 3010d1710679SStefano Zampini #if defined(PETSC_USE_COMPLEX) 3011d1710679SStefano Zampini rwork = NULL; 3012d1710679SStefano Zampini #endif 30138bec7fa6SStefano Zampini thresh = 1.0; 301408122e43SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 301508122e43SStefano Zampini #if defined(PETSC_USE_COMPLEX) 301608122e43SStefano Zampini PetscStackCallBLAS("LAPACKsygvx",LAPACKsygvx_(&B_itype,"V","V","L",&B_N,St,&B_N,S,&B_N,&zero,&thresh,&B_dummyint,&B_dummyint,&eps,&B_neigs,eigs,eigv,&B_N,&lwork,&B_lwork,rwork,B_iwork,B_ifail,&B_ierr)); 301708122e43SStefano Zampini #else 301808122e43SStefano Zampini PetscStackCallBLAS("LAPACKsygvx",LAPACKsygvx_(&B_itype,"V","V","L",&B_N,St,&B_N,S,&B_N,&zero,&thresh,&B_dummyint,&B_dummyint,&eps,&B_neigs,eigs,eigv,&B_N,&lwork,&B_lwork,B_iwork,B_ifail,&B_ierr)); 301908122e43SStefano Zampini #endif 302008122e43SStefano Zampini if (B_ierr != 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in query to SYGVX Lapack routine %d",(int)B_ierr); 302108122e43SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 302208122e43SStefano Zampini } else { 302308122e43SStefano Zampini /* TODO */ 302408122e43SStefano Zampini } 302508122e43SStefano Zampini } else { 302608122e43SStefano Zampini lwork = 0; 302708122e43SStefano Zampini } 302808122e43SStefano Zampini 302908122e43SStefano Zampini nv = 0; 3030d62866d3SStefano Zampini if 
(sub_schurs->is_vertices && pcbddc->use_vertices) { /* complement set of active subsets, each entry is a vertex (boundary made by active subsets, vertices and dirichlet dofs) */ 3031d62866d3SStefano Zampini ierr = ISGetLocalSize(sub_schurs->is_vertices,&nv);CHKERRQ(ierr); 303208122e43SStefano Zampini } 30334c6709b3SStefano Zampini ierr = PetscBLASIntCast((PetscInt)PetscRealPart(lwork),&B_lwork);CHKERRQ(ierr); 3034f6f667cfSStefano Zampini if (allocated_S_St) { 3035f6f667cfSStefano Zampini ierr = PetscMalloc2(mss*mss,&S,mss*mss,&St);CHKERRQ(ierr); 3036f6f667cfSStefano Zampini } 3037f6f667cfSStefano Zampini ierr = PetscMalloc5(mss*mss,&eigv,mss,&eigs,B_lwork,&work,5*mss,&B_iwork,mss,&B_ifail);CHKERRQ(ierr); 303808122e43SStefano Zampini #if defined(PETSC_USE_COMPLEX) 303908122e43SStefano Zampini ierr = PetscMalloc1(7*mss,&rwork);CHKERRQ(ierr); 304008122e43SStefano Zampini #endif 30419162d606SStefano Zampini ierr = PetscMalloc5(nv+sub_schurs->n_subs,&pcbddc->adaptive_constraints_n, 30429162d606SStefano Zampini nv+sub_schurs->n_subs+1,&pcbddc->adaptive_constraints_idxs_ptr, 30439162d606SStefano Zampini nv+sub_schurs->n_subs+1,&pcbddc->adaptive_constraints_data_ptr, 304408122e43SStefano Zampini nv+cum,&pcbddc->adaptive_constraints_idxs, 30459162d606SStefano Zampini nv+cum2,&pcbddc->adaptive_constraints_data);CHKERRQ(ierr); 304608122e43SStefano Zampini ierr = PetscMemzero(pcbddc->adaptive_constraints_n,(nv+sub_schurs->n_subs)*sizeof(PetscInt));CHKERRQ(ierr); 304708122e43SStefano Zampini 304808122e43SStefano Zampini maxneigs = 0; 304972b8c272SStefano Zampini cum = cumarray = 0; 30509162d606SStefano Zampini pcbddc->adaptive_constraints_idxs_ptr[0] = 0; 30519162d606SStefano Zampini pcbddc->adaptive_constraints_data_ptr[0] = 0; 3052d62866d3SStefano Zampini if (sub_schurs->is_vertices && pcbddc->use_vertices) { 305308122e43SStefano Zampini const PetscInt *idxs; 305408122e43SStefano Zampini 3055d62866d3SStefano Zampini ierr = 
ISGetIndices(sub_schurs->is_vertices,&idxs);CHKERRQ(ierr); 305608122e43SStefano Zampini for (cum=0;cum<nv;cum++) { 305708122e43SStefano Zampini pcbddc->adaptive_constraints_n[cum] = 1; 305808122e43SStefano Zampini pcbddc->adaptive_constraints_idxs[cum] = idxs[cum]; 305908122e43SStefano Zampini pcbddc->adaptive_constraints_data[cum] = 1.0; 30609162d606SStefano Zampini pcbddc->adaptive_constraints_idxs_ptr[cum+1] = pcbddc->adaptive_constraints_idxs_ptr[cum]+1; 30619162d606SStefano Zampini pcbddc->adaptive_constraints_data_ptr[cum+1] = pcbddc->adaptive_constraints_data_ptr[cum]+1; 306208122e43SStefano Zampini } 3063d62866d3SStefano Zampini ierr = ISRestoreIndices(sub_schurs->is_vertices,&idxs);CHKERRQ(ierr); 306408122e43SStefano Zampini } 306508122e43SStefano Zampini 306608122e43SStefano Zampini if (mss) { /* multilevel */ 306708122e43SStefano Zampini ierr = MatSeqAIJGetArray(sub_schurs->sum_S_Ej_inv_all,&Sarray);CHKERRQ(ierr); 306808122e43SStefano Zampini ierr = MatSeqAIJGetArray(sub_schurs->sum_S_Ej_tilda_all,&Starray);CHKERRQ(ierr); 306908122e43SStefano Zampini } 307008122e43SStefano Zampini 3071ffd830a3SStefano Zampini thresh = pcbddc->adaptive_threshold; 307208122e43SStefano Zampini for (i=0;i<sub_schurs->n_subs;i++) { 307308122e43SStefano Zampini const PetscInt *idxs; 30749d54b7f4SStefano Zampini PetscReal upper,lower; 3075862806e4SStefano Zampini PetscInt j,subset_size,eigs_start = 0; 307608122e43SStefano Zampini PetscBLASInt B_N; 3077aff50787SStefano Zampini PetscBool same_data = PETSC_FALSE; 307808122e43SStefano Zampini 30799d54b7f4SStefano Zampini if (pcbddc->use_deluxe_scaling) { 30809d54b7f4SStefano Zampini upper = PETSC_MAX_REAL; 30819d54b7f4SStefano Zampini lower = thresh; 30829d54b7f4SStefano Zampini } else { 30839d54b7f4SStefano Zampini upper = 1./thresh; 30849d54b7f4SStefano Zampini lower = 0.; 30859d54b7f4SStefano Zampini } 3086862806e4SStefano Zampini ierr = ISGetLocalSize(sub_schurs->is_subs[i],&subset_size);CHKERRQ(ierr); 3087ffd830a3SStefano 
Zampini ierr = ISGetIndices(sub_schurs->is_subs[i],&idxs);CHKERRQ(ierr); 3088f6f667cfSStefano Zampini ierr = PetscBLASIntCast(subset_size,&B_N);CHKERRQ(ierr); 3089f6f667cfSStefano Zampini if (allocated_S_St) { /* S and S_t should be copied since we could need them later */ 30909ab7bb16SStefano Zampini if (sub_schurs->is_hermitian) { 3091aff50787SStefano Zampini PetscInt j,k; 3092aff50787SStefano Zampini if (sub_schurs->n_subs == 1) { /* zeroing memory to use PetscMemcmp later */ 3093aff50787SStefano Zampini ierr = PetscMemzero(S,subset_size*subset_size*sizeof(PetscScalar));CHKERRQ(ierr); 3094aff50787SStefano Zampini ierr = PetscMemzero(St,subset_size*subset_size*sizeof(PetscScalar));CHKERRQ(ierr); 309508122e43SStefano Zampini } 309608122e43SStefano Zampini for (j=0;j<subset_size;j++) { 3097aff50787SStefano Zampini for (k=j;k<subset_size;k++) { 3098aff50787SStefano Zampini S [j*subset_size+k] = Sarray [cumarray+j*subset_size+k]; 3099aff50787SStefano Zampini St[j*subset_size+k] = Starray[cumarray+j*subset_size+k]; 3100aff50787SStefano Zampini } 310108122e43SStefano Zampini } 310208122e43SStefano Zampini } else { 310308122e43SStefano Zampini ierr = PetscMemcpy(S,Sarray+cumarray,subset_size*subset_size*sizeof(PetscScalar));CHKERRQ(ierr); 310408122e43SStefano Zampini ierr = PetscMemcpy(St,Starray+cumarray,subset_size*subset_size*sizeof(PetscScalar));CHKERRQ(ierr); 310508122e43SStefano Zampini } 31068bec7fa6SStefano Zampini } else { 3107f6f667cfSStefano Zampini S = Sarray + cumarray; 3108f6f667cfSStefano Zampini St = Starray + cumarray; 31098bec7fa6SStefano Zampini } 3110aff50787SStefano Zampini /* see if we can save some work */ 3111b7ab4a40SStefano Zampini if (sub_schurs->n_subs == 1 && pcbddc->use_deluxe_scaling) { 3112aff50787SStefano Zampini ierr = PetscMemcmp(S,St,subset_size*subset_size*sizeof(PetscScalar),&same_data);CHKERRQ(ierr); 3113aff50787SStefano Zampini } 3114aff50787SStefano Zampini 3115b7ab4a40SStefano Zampini if (same_data && !sub_schurs->change) { /* 
there's no need of constraints here */ 3116aff50787SStefano Zampini B_neigs = 0; 3117aff50787SStefano Zampini } else { 31189ab7bb16SStefano Zampini if (sub_schurs->is_hermitian && sub_schurs->is_posdef) { 311908122e43SStefano Zampini PetscBLASInt B_itype = 1; 3120f6f667cfSStefano Zampini PetscBLASInt B_IL, B_IU; 31214c6709b3SStefano Zampini PetscReal eps = -1.0; /* dlamch? */ 31229552c7c7SStefano Zampini PetscInt nmin_s; 3123b7ab4a40SStefano Zampini PetscBool compute_range = PETSC_FALSE; 312408122e43SStefano Zampini 3125fd14bc51SStefano Zampini if (pcbddc->dbg_flag) { 3126eee23b56SStefano Zampini PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"Computing for sub %d/%d size %d count %d fid %d.\n",i,sub_schurs->n_subs,subset_size,pcbddc->mat_graph->count[idxs[0]]+1,pcbddc->mat_graph->which_dof[idxs[0]]); 3127fd14bc51SStefano Zampini } 3128d16cbb6bSStefano Zampini 3129b7ab4a40SStefano Zampini compute_range = PETSC_FALSE; 3130b7ab4a40SStefano Zampini if (thresh > 1.+PETSC_SMALL && !same_data) { 3131b7ab4a40SStefano Zampini compute_range = PETSC_TRUE; 3132b7ab4a40SStefano Zampini } 3133b7ab4a40SStefano Zampini 313408122e43SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 3135b7ab4a40SStefano Zampini if (compute_range) { 3136d16cbb6bSStefano Zampini 3137d16cbb6bSStefano Zampini /* ask for eigenvalues larger than thresh */ 313808122e43SStefano Zampini #if defined(PETSC_USE_COMPLEX) 31399d54b7f4SStefano Zampini PetscStackCallBLAS("LAPACKsygvx",LAPACKsygvx_(&B_itype,"V","V","L",&B_N,St,&B_N,S,&B_N,&lower,&upper,&B_IL,&B_IU,&eps,&B_neigs,eigs,eigv,&B_N,work,&B_lwork,rwork,B_iwork,B_ifail,&B_ierr)); 314008122e43SStefano Zampini #else 31419d54b7f4SStefano Zampini PetscStackCallBLAS("LAPACKsygvx",LAPACKsygvx_(&B_itype,"V","V","L",&B_N,St,&B_N,S,&B_N,&lower,&upper,&B_IL,&B_IU,&eps,&B_neigs,eigs,eigv,&B_N,work,&B_lwork,B_iwork,B_ifail,&B_ierr)); 314208122e43SStefano Zampini #endif 3143b7ab4a40SStefano Zampini } else if (!same_data) { 
3144d16cbb6bSStefano Zampini B_IU = PetscMax(1,PetscMin(B_N,nmax)); 3145d16cbb6bSStefano Zampini B_IL = 1; 3146d16cbb6bSStefano Zampini #if defined(PETSC_USE_COMPLEX) 31479d54b7f4SStefano Zampini PetscStackCallBLAS("LAPACKsygvx",LAPACKsygvx_(&B_itype,"V","I","L",&B_N,St,&B_N,S,&B_N,&lower,&upper,&B_IL,&B_IU,&eps,&B_neigs,eigs,eigv,&B_N,work,&B_lwork,rwork,B_iwork,B_ifail,&B_ierr)); 3148d16cbb6bSStefano Zampini #else 31499d54b7f4SStefano Zampini PetscStackCallBLAS("LAPACKsygvx",LAPACKsygvx_(&B_itype,"V","I","L",&B_N,St,&B_N,S,&B_N,&lower,&upper,&B_IL,&B_IU,&eps,&B_neigs,eigs,eigv,&B_N,work,&B_lwork,B_iwork,B_ifail,&B_ierr)); 3150d16cbb6bSStefano Zampini #endif 3151b03ebc13SStefano Zampini } else { /* same_data is true, so just get the adaptive functional requested by the user */ 3152b7ab4a40SStefano Zampini PetscInt k; 3153b7ab4a40SStefano Zampini if (!sub_schurs->change_primal_sub) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"This should not happen"); 3154b7ab4a40SStefano Zampini ierr = ISGetLocalSize(sub_schurs->change_primal_sub[i],&nmax);CHKERRQ(ierr); 3155b7ab4a40SStefano Zampini ierr = PetscBLASIntCast(nmax,&B_neigs);CHKERRQ(ierr); 3156b7ab4a40SStefano Zampini nmin = nmax; 3157b7ab4a40SStefano Zampini ierr = PetscMemzero(eigv,subset_size*nmax*sizeof(PetscScalar));CHKERRQ(ierr); 3158b7ab4a40SStefano Zampini for (k=0;k<nmax;k++) { 3159b7ab4a40SStefano Zampini eigs[k] = 1./PETSC_SMALL; 3160b7ab4a40SStefano Zampini eigv[k*(subset_size+1)] = 1.0; 3161b7ab4a40SStefano Zampini } 3162d16cbb6bSStefano Zampini } 316308122e43SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 316408122e43SStefano Zampini if (B_ierr) { 31656c4ed002SBarry Smith if (B_ierr < 0 ) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in SYGVX Lapack routine: illegal value for argument %d",-(int)B_ierr); 31666c4ed002SBarry Smith else if (B_ierr <= B_N) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in SYGVX Lapack routine: %d eigenvalues failed to converge",(int)B_ierr); 31676c4ed002SBarry Smith else 
SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in SYGVX Lapack routine: leading minor of order %d is not positive definite",(int)B_ierr-B_N-1); 316808122e43SStefano Zampini } 316908122e43SStefano Zampini 317008122e43SStefano Zampini if (B_neigs > nmax) { 3171fd14bc51SStefano Zampini if (pcbddc->dbg_flag) { 3172fd14bc51SStefano Zampini PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer," found %d eigs, more than maximum required %d.\n",B_neigs,nmax); 3173fd14bc51SStefano Zampini } 31749d54b7f4SStefano Zampini if (pcbddc->use_deluxe_scaling) eigs_start = B_neigs -nmax; 317508122e43SStefano Zampini B_neigs = nmax; 317608122e43SStefano Zampini } 317708122e43SStefano Zampini 31789552c7c7SStefano Zampini nmin_s = PetscMin(nmin,B_N); 31799552c7c7SStefano Zampini if (B_neigs < nmin_s) { 318008122e43SStefano Zampini PetscBLASInt B_neigs2; 318108122e43SStefano Zampini 31829d54b7f4SStefano Zampini if (pcbddc->use_deluxe_scaling) { 3183f6f667cfSStefano Zampini B_IL = B_N - nmin_s + 1; 31849d54b7f4SStefano Zampini B_IU = B_N - B_neigs; 31859d54b7f4SStefano Zampini } else { 31869d54b7f4SStefano Zampini B_IL = B_neigs + 1; 31879d54b7f4SStefano Zampini B_IU = nmin_s; 31889d54b7f4SStefano Zampini } 3189fd14bc51SStefano Zampini if (pcbddc->dbg_flag) { 3190fd14bc51SStefano Zampini PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer," found %d eigs, less than minimum required %d. 
Asking for %d to %d incl (fortran like)\n",B_neigs,nmin,B_IL,B_IU); 3191fd14bc51SStefano Zampini } 31929ab7bb16SStefano Zampini if (sub_schurs->is_hermitian) { 31931ae86dd6SStefano Zampini PetscInt j,k; 319408122e43SStefano Zampini for (j=0;j<subset_size;j++) { 31951ae86dd6SStefano Zampini for (k=j;k<subset_size;k++) { 31961ae86dd6SStefano Zampini S [j*subset_size+k] = Sarray [cumarray+j*subset_size+k]; 31971ae86dd6SStefano Zampini St[j*subset_size+k] = Starray[cumarray+j*subset_size+k]; 319808122e43SStefano Zampini } 319908122e43SStefano Zampini } 320008122e43SStefano Zampini } else { 320108122e43SStefano Zampini ierr = PetscMemcpy(S,Sarray+cumarray,subset_size*subset_size*sizeof(PetscScalar));CHKERRQ(ierr); 320208122e43SStefano Zampini ierr = PetscMemcpy(St,Starray+cumarray,subset_size*subset_size*sizeof(PetscScalar));CHKERRQ(ierr); 320308122e43SStefano Zampini } 320408122e43SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 320508122e43SStefano Zampini #if defined(PETSC_USE_COMPLEX) 32069d54b7f4SStefano Zampini PetscStackCallBLAS("LAPACKsygvx",LAPACKsygvx_(&B_itype,"V","I","L",&B_N,St,&B_N,S,&B_N,&lower,&upper,&B_IL,&B_IU,&eps,&B_neigs2,eigs+B_neigs,eigv+B_neigs*subset_size,&B_N,work,&B_lwork,rwork,B_iwork,B_ifail,&B_ierr)); 320708122e43SStefano Zampini #else 32089d54b7f4SStefano Zampini PetscStackCallBLAS("LAPACKsygvx",LAPACKsygvx_(&B_itype,"V","I","L",&B_N,St,&B_N,S,&B_N,&lower,&upper,&B_IL,&B_IU,&eps,&B_neigs2,eigs+B_neigs,eigv+B_neigs*subset_size,&B_N,work,&B_lwork,B_iwork,B_ifail,&B_ierr)); 320908122e43SStefano Zampini #endif 321008122e43SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 321108122e43SStefano Zampini B_neigs += B_neigs2; 321208122e43SStefano Zampini } 321308122e43SStefano Zampini if (B_ierr) { 32146c4ed002SBarry Smith if (B_ierr < 0 ) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in SYGVX Lapack routine: illegal value for argument %d",-(int)B_ierr); 32156c4ed002SBarry Smith else if (B_ierr <= B_N) 
SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in SYGVX Lapack routine: %d eigenvalues failed to converge",(int)B_ierr); 32166c4ed002SBarry Smith else SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in SYGVX Lapack routine: leading minor of order %d is not positive definite",(int)B_ierr-B_N-1); 321708122e43SStefano Zampini } 3218fd14bc51SStefano Zampini if (pcbddc->dbg_flag) { 3219ac47001eSStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer," -> Got %d eigs\n",B_neigs);CHKERRQ(ierr); 322008122e43SStefano Zampini for (j=0;j<B_neigs;j++) { 322108122e43SStefano Zampini if (eigs[j] == 0.0) { 3222ac47001eSStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer," Inf\n");CHKERRQ(ierr); 322308122e43SStefano Zampini } else { 32249d54b7f4SStefano Zampini if (pcbddc->use_deluxe_scaling) { 3225ac47001eSStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer," %1.6e\n",eigs[j+eigs_start]);CHKERRQ(ierr); 32269d54b7f4SStefano Zampini } else { 32279d54b7f4SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer," %1.6e\n",1./eigs[j+eigs_start]);CHKERRQ(ierr); 32289d54b7f4SStefano Zampini } 3229fd14bc51SStefano Zampini } 323008122e43SStefano Zampini } 323108122e43SStefano Zampini } 323208122e43SStefano Zampini } else { 323308122e43SStefano Zampini /* TODO */ 323408122e43SStefano Zampini } 3235aff50787SStefano Zampini } 32366c3e6151SStefano Zampini /* change the basis back to the original one */ 32376c3e6151SStefano Zampini if (sub_schurs->change) { 323872b8c272SStefano Zampini Mat change,phi,phit; 32396c3e6151SStefano Zampini 32406c3e6151SStefano Zampini if (pcbddc->dbg_flag > 1) { 32416c3e6151SStefano Zampini PetscInt ii; 32426c3e6151SStefano Zampini for (ii=0;ii<B_neigs;ii++) { 32436c3e6151SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer," -> Eigenvector (old basis) %d/%d (%d)\n",ii,B_neigs,B_N);CHKERRQ(ierr); 32446c3e6151SStefano Zampini for (j=0;j<B_N;j++) { 
3245684229deSStefano Zampini #if defined(PETSC_USE_COMPLEX) 3246684229deSStefano Zampini PetscReal r = PetscRealPart(eigv[(ii+eigs_start)*subset_size+j]); 3247684229deSStefano Zampini PetscReal c = PetscImaginaryPart(eigv[(ii+eigs_start)*subset_size+j]); 3248684229deSStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer," %1.4e + %1.4e i\n",r,c);CHKERRQ(ierr); 3249684229deSStefano Zampini #else 32506c3e6151SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer," %1.4e\n",eigv[(ii+eigs_start)*subset_size+j]);CHKERRQ(ierr); 3251684229deSStefano Zampini #endif 32526c3e6151SStefano Zampini } 32536c3e6151SStefano Zampini } 32546c3e6151SStefano Zampini } 325572b8c272SStefano Zampini ierr = KSPGetOperators(sub_schurs->change[i],&change,NULL);CHKERRQ(ierr); 32566c3e6151SStefano Zampini ierr = MatCreateSeqDense(PETSC_COMM_SELF,subset_size,B_neigs,eigv+eigs_start*subset_size,&phit);CHKERRQ(ierr); 325772b8c272SStefano Zampini ierr = MatMatMult(change,phit,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&phi);CHKERRQ(ierr); 32586c3e6151SStefano Zampini ierr = MatCopy(phi,phit,SAME_NONZERO_PATTERN);CHKERRQ(ierr); 32596c3e6151SStefano Zampini ierr = MatDestroy(&phit);CHKERRQ(ierr); 32606c3e6151SStefano Zampini ierr = MatDestroy(&phi);CHKERRQ(ierr); 32616c3e6151SStefano Zampini } 32628bec7fa6SStefano Zampini maxneigs = PetscMax(B_neigs,maxneigs); 32638bec7fa6SStefano Zampini pcbddc->adaptive_constraints_n[i+nv] = B_neigs; 32649162d606SStefano Zampini if (B_neigs) { 32659162d606SStefano Zampini ierr = PetscMemcpy(pcbddc->adaptive_constraints_data+pcbddc->adaptive_constraints_data_ptr[cum],eigv+eigs_start*subset_size,B_neigs*subset_size*sizeof(PetscScalar));CHKERRQ(ierr); 3266fd14bc51SStefano Zampini 3267fd14bc51SStefano Zampini if (pcbddc->dbg_flag > 1) { 32689552c7c7SStefano Zampini PetscInt ii; 32699552c7c7SStefano Zampini for (ii=0;ii<B_neigs;ii++) { 3270ac47001eSStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer," -> 
Eigenvector %d/%d (%d)\n",ii,B_neigs,B_N);CHKERRQ(ierr); 32719552c7c7SStefano Zampini for (j=0;j<B_N;j++) { 3272ac47001eSStefano Zampini #if defined(PETSC_USE_COMPLEX) 3273ac47001eSStefano Zampini PetscReal r = PetscRealPart(pcbddc->adaptive_constraints_data[ii*subset_size+j+pcbddc->adaptive_constraints_data_ptr[cum]]); 3274ac47001eSStefano Zampini PetscReal c = PetscImaginaryPart(pcbddc->adaptive_constraints_data[ii*subset_size+j+pcbddc->adaptive_constraints_data_ptr[cum]]); 3275ac47001eSStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer," %1.4e + %1.4e i\n",r,c);CHKERRQ(ierr); 3276ac47001eSStefano Zampini #else 3277ac47001eSStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer," %1.4e\n",pcbddc->adaptive_constraints_data[ii*subset_size+j+pcbddc->adaptive_constraints_data_ptr[cum]]);CHKERRQ(ierr); 3278ac47001eSStefano Zampini #endif 32799552c7c7SStefano Zampini } 32809552c7c7SStefano Zampini } 3281fd14bc51SStefano Zampini } 32829162d606SStefano Zampini ierr = PetscMemcpy(pcbddc->adaptive_constraints_idxs+pcbddc->adaptive_constraints_idxs_ptr[cum],idxs,subset_size*sizeof(PetscInt));CHKERRQ(ierr); 32839162d606SStefano Zampini pcbddc->adaptive_constraints_idxs_ptr[cum+1] = pcbddc->adaptive_constraints_idxs_ptr[cum] + subset_size; 32849162d606SStefano Zampini pcbddc->adaptive_constraints_data_ptr[cum+1] = pcbddc->adaptive_constraints_data_ptr[cum] + subset_size*B_neigs; 32859162d606SStefano Zampini cum++; 328608122e43SStefano Zampini } 328708122e43SStefano Zampini ierr = ISRestoreIndices(sub_schurs->is_subs[i],&idxs);CHKERRQ(ierr); 328808122e43SStefano Zampini /* shift for next computation */ 328908122e43SStefano Zampini cumarray += subset_size*subset_size; 329008122e43SStefano Zampini } 3291fd14bc51SStefano Zampini if (pcbddc->dbg_flag) { 3292fd14bc51SStefano Zampini ierr = PetscViewerFlush(pcbddc->dbg_viewer);CHKERRQ(ierr); 3293fd14bc51SStefano Zampini } 329408122e43SStefano Zampini 329508122e43SStefano Zampini if 
(mss) { 329608122e43SStefano Zampini ierr = MatSeqAIJRestoreArray(sub_schurs->sum_S_Ej_inv_all,&Sarray);CHKERRQ(ierr); 329708122e43SStefano Zampini ierr = MatSeqAIJRestoreArray(sub_schurs->sum_S_Ej_tilda_all,&Starray);CHKERRQ(ierr); 3298f6f667cfSStefano Zampini /* destroy matrices (junk) */ 3299f6f667cfSStefano Zampini ierr = MatDestroy(&sub_schurs->sum_S_Ej_inv_all);CHKERRQ(ierr); 3300f6f667cfSStefano Zampini ierr = MatDestroy(&sub_schurs->sum_S_Ej_tilda_all);CHKERRQ(ierr); 330108122e43SStefano Zampini } 3302f6f667cfSStefano Zampini if (allocated_S_St) { 3303f6f667cfSStefano Zampini ierr = PetscFree2(S,St);CHKERRQ(ierr); 3304f6f667cfSStefano Zampini } 3305f6f667cfSStefano Zampini ierr = PetscFree5(eigv,eigs,work,B_iwork,B_ifail);CHKERRQ(ierr); 330608122e43SStefano Zampini #if defined(PETSC_USE_COMPLEX) 330708122e43SStefano Zampini ierr = PetscFree(rwork);CHKERRQ(ierr); 330808122e43SStefano Zampini #endif 330908122e43SStefano Zampini if (pcbddc->dbg_flag) { 33101b968477SStefano Zampini PetscInt maxneigs_r; 3311b2566f29SBarry Smith ierr = MPIU_Allreduce(&maxneigs,&maxneigs_r,1,MPIU_INT,MPI_MAX,PetscObjectComm((PetscObject)pc));CHKERRQ(ierr); 33129b28b941SStefano Zampini ierr = PetscViewerASCIIPrintf(pcbddc->dbg_viewer,"Maximum number of constraints per cc %d\n",maxneigs_r);CHKERRQ(ierr); 331308122e43SStefano Zampini } 331408122e43SStefano Zampini PetscFunctionReturn(0); 331508122e43SStefano Zampini } 3316b1b3d7a2SStefano Zampini

/*
   PCBDDCSetUpSolvers - Runs the solver setup stages of the preconditioner in sequence.

   Input Parameter:
.  pc - the preconditioner context

   Notes:
   The stages are executed in this order: local scatters, local solvers,
   local correction, coarse solver. The array handed back by
   PCBDDCSetUpCorrection is passed to PCBDDCSetUpCoarseSolver and then freed here.
*/
PetscErrorCode PCBDDCSetUpSolvers(PC pc)
{
  PetscScalar    *submat_vals;
  PetscErrorCode ierr;

  PetscFunctionBegin;
  /* Local scatters R_to_B and (optionally) R_to_D.
     PCBDDCSetUpLocalWorkVectors should be called first! */
  ierr = PCBDDCSetUpLocalScatters(pc);CHKERRQ(ierr);

  /* Local neumann solver ksp_R.
     PCBDDCSetUpLocalScatters should be called first! */
  ierr = PCBDDCSetUpLocalSolvers(pc,PETSC_FALSE,PETSC_TRUE);CHKERRQ(ierr);

  /* Local correction and local part of the coarse basis.
     Gives back the dense local part of the coarse matrix in column major ordering */
  ierr = PCBDDCSetUpCorrection(pc,&submat_vals);CHKERRQ(ierr);

  /* Compute total number of coarse nodes and setup coarse solver */
  ierr = PCBDDCSetUpCoarseSolver(pc,submat_vals);CHKERRQ(ierr);

  /* the coarse values are no longer needed once the coarse solver is set up */
  ierr = PetscFree(submat_vals);CHKERRQ(ierr);
  PetscFunctionReturn(0);
}

/*
   PCBDDCResetCustomization - Releases the user-provided customization held by the BDDC context.

   Input Parameter:
.  pc - the preconditioner context

   Notes:
   Destroys the primal-vertex and Neumann/Dirichlet boundary index sets
   (plain and "local" variants), the stored near-null space together with
   its state array, and resets both dofs splittings by passing 0 fields.
*/
PetscErrorCode PCBDDCResetCustomization(PC pc)
{
  PC_BDDC        *pcbddc = (PC_BDDC*)pc->data;
  PetscErrorCode ierr;

  PetscFunctionBegin;
  /* primal vertices */
  ierr = ISDestroy(&pcbddc->user_primal_vertices);CHKERRQ(ierr);
  ierr = ISDestroy(&pcbddc->user_primal_vertices_local);CHKERRQ(ierr);

  /* boundaries and near-null space */
  ierr = ISDestroy(&pcbddc->NeumannBoundaries);CHKERRQ(ierr);
  ierr = ISDestroy(&pcbddc->NeumannBoundariesLocal);CHKERRQ(ierr);
  ierr = ISDestroy(&pcbddc->DirichletBoundaries);CHKERRQ(ierr);
  ierr = MatNullSpaceDestroy(&pcbddc->onearnullspace);CHKERRQ(ierr);
  ierr = PetscFree(pcbddc->onearnullvecs_state);CHKERRQ(ierr);
  ierr = ISDestroy(&pcbddc->DirichletBoundariesLocal);CHKERRQ(ierr);

  /* dofs splitting: setting zero fields clears what was stored */
  ierr = PCBDDCSetDofsSplitting(pc,0,NULL);CHKERRQ(ierr);
  ierr = PCBDDCSetDofsSplittingLocal(pc,0,NULL);CHKERRQ(ierr);
  PetscFunctionReturn(0);
}

/*
   PCBDDCResetTopography - Releases the objects stored in the BDDC context that are listed below.

   Input Parameter:
.  pc - the preconditioner context

   Notes:
   Destroys the nedelec/discrete-gradient data, the change of basis and
   constraint matrices, the divudotp data, the graph, the local subdomain
   index sets and the sub Schurs object. On exit graphanalyzed is
   PETSC_FALSE and recompute_topography is PETSC_TRUE.
*/
PetscErrorCode PCBDDCResetTopography(PC pc)
{
  PC_BDDC        *pcbddc = (PC_BDDC*)pc->data;
  PetscInt       s;
  PetscErrorCode ierr;

  PetscFunctionBegin;
  ierr = MatDestroy(&pcbddc->nedcG);CHKERRQ(ierr);
  ierr = ISDestroy(&pcbddc->nedclocal);CHKERRQ(ierr);
  ierr = MatDestroy(&pcbddc->discretegradient);CHKERRQ(ierr);
  ierr = MatDestroy(&pcbddc->user_ChangeOfBasisMatrix);CHKERRQ(ierr);
  ierr = MatDestroy(&pcbddc->ChangeOfBasisMatrix);CHKERRQ(ierr);
  ierr = MatDestroy(&pcbddc->switch_static_change);CHKERRQ(ierr);
  ierr = VecDestroy(&pcbddc->work_change);CHKERRQ(ierr);
  ierr = MatDestroy(&pcbddc->ConstraintMatrix);CHKERRQ(ierr);
  ierr = MatDestroy(&pcbddc->divudotp);CHKERRQ(ierr);
  ierr = ISDestroy(&pcbddc->divudotp_vl2l);CHKERRQ(ierr);
  ierr = PCBDDCGraphDestroy(&pcbddc->mat_graph);CHKERRQ(ierr);

  /* each local subdomain index set is destroyed before the array holding them is freed */
  for (s=0;s<pcbddc->n_local_subs;s++) {
    ierr = ISDestroy(&pcbddc->local_subs[s]);CHKERRQ(ierr);
  }
  pcbddc->n_local_subs = 0;
  ierr = PetscFree(pcbddc->local_subs);CHKERRQ(ierr);

  ierr = PCBDDCSubSchursDestroy(&pcbddc->sub_schurs);CHKERRQ(ierr);

  /* update the status flags */
  pcbddc->graphanalyzed        = PETSC_FALSE;
  pcbddc->recompute_topography = PETSC_TRUE;
  PetscFunctionReturn(0);
}

/*
   PCBDDCResetSolvers - Releases the solver-related data stored in the BDDC context.

   Input Parameter:
.  pc - the preconditioner context

   Notes:
   Destroys the coarse basis matrices, work vectors, scatters and index
   sets, frees the primal index arrays and the benign-trick data, and
   calls KSPReset() (not KSPDestroy()) on ksp_D, ksp_R and coarse_ksp.
*/
PetscErrorCode PCBDDCResetSolvers(PC pc)
{
  PC_BDDC        *pcbddc = (PC_BDDC*)pc->data;
  PetscErrorCode ierr;

  PetscFunctionBegin;
  ierr = VecDestroy(&pcbddc->coarse_vec);CHKERRQ(ierr);

  /* the storage behind coarse_phi_B is freed explicitly before the matrix is destroyed */
  if (pcbddc->coarse_phi_B) {
    PetscScalar *phi_B_vals;

    ierr = MatDenseGetArray(pcbddc->coarse_phi_B,&phi_B_vals);CHKERRQ(ierr);
    ierr = PetscFree(phi_B_vals);CHKERRQ(ierr);
  }

  /* coarse basis functions */
  ierr = MatDestroy(&pcbddc->coarse_phi_B);CHKERRQ(ierr);
  ierr = MatDestroy(&pcbddc->coarse_phi_D);CHKERRQ(ierr);
  ierr = MatDestroy(&pcbddc->coarse_psi_B);CHKERRQ(ierr);
  ierr = MatDestroy(&pcbddc->coarse_psi_D);CHKERRQ(ierr);

  /* work vectors, auxiliary matrices, index sets and scatters */
  ierr = VecDestroy(&pcbddc->vec1_P);CHKERRQ(ierr);
  ierr = VecDestroy(&pcbddc->vec1_C);CHKERRQ(ierr);
  ierr = MatDestroy(&pcbddc->local_auxmat2);CHKERRQ(ierr);
  ierr = MatDestroy(&pcbddc->local_auxmat1);CHKERRQ(ierr);
  ierr = VecDestroy(&pcbddc->vec1_R);CHKERRQ(ierr);
  ierr = VecDestroy(&pcbddc->vec2_R);CHKERRQ(ierr);
  ierr = ISDestroy(&pcbddc->is_R_local);CHKERRQ(ierr);
  ierr = VecScatterDestroy(&pcbddc->R_to_B);CHKERRQ(ierr);
  ierr = VecScatterDestroy(&pcbddc->R_to_D);CHKERRQ(ierr);
  ierr = VecScatterDestroy(&pcbddc->coarse_loc_to_glob);CHKERRQ(ierr);

  /* solvers are reset, not destroyed */
  ierr = KSPReset(pcbddc->ksp_D);CHKERRQ(ierr);
  ierr = KSPReset(pcbddc->ksp_R);CHKERRQ(ierr);
  ierr = KSPReset(pcbddc->coarse_ksp);CHKERRQ(ierr);

  /* local matrix and primal bookkeeping */
  ierr = MatDestroy(&pcbddc->local_mat);CHKERRQ(ierr);
  ierr = PetscFree(pcbddc->primal_indices_local_idxs);CHKERRQ(ierr);
  ierr = PetscFree2(pcbddc->local_primal_ref_node,pcbddc->local_primal_ref_mult);CHKERRQ(ierr);
  ierr = PetscFree(pcbddc->global_primal_indices);CHKERRQ(ierr);
  ierr = ISDestroy(&pcbddc->coarse_subassembling);CHKERRQ(ierr);

  /* benign trick data */
  ierr = MatDestroy(&pcbddc->benign_change);CHKERRQ(ierr);
  ierr = VecDestroy(&pcbddc->benign_vec);CHKERRQ(ierr);
  ierr = PCBDDCBenignShellMat(pc,PETSC_TRUE);CHKERRQ(ierr);
  ierr = MatDestroy(&pcbddc->benign_B0);CHKERRQ(ierr);
  ierr = PetscSFDestroy(&pcbddc->benign_sf);CHKERRQ(ierr);
  if (pcbddc->benign_zerodiag_subs) {
    PetscInt s;

    for (s=0;s<pcbddc->benign_n;s++) {
      ierr = ISDestroy(&pcbddc->benign_zerodiag_subs[s]);CHKERRQ(ierr);
    }
    ierr = PetscFree(pcbddc->benign_zerodiag_subs);CHKERRQ(ierr);
  }
  ierr = PetscFree3(pcbddc->benign_p0_lidx,pcbddc->benign_p0_gidx,pcbddc->benign_p0);CHKERRQ(ierr);
  PetscFunctionReturn(0);
}

/*
   PCBDDCSetUpLocalWorkVectors - (Re)creates the local work vectors vec1_R, vec2_R, vec1_P and vec1_C.

   Input Parameter:
.  pc - the preconditioner context

   Notes:
   A vector is recreated only when its required size differs from the
   size of the one currently stored (a missing vector counts as size -1).
   vec1_C is additionally left untouched when there are no constraints.
   New vectors take their type and communicator from pcis->vec1_N.
*/
PetscErrorCode PCBDDCSetUpLocalWorkVectors(PC pc)
{
  PC_BDDC        *pcbddc = (PC_BDDC*)pc->data;
  PC_IS          *pcis = (PC_IS*)pc->data;
  VecType        vtype;
  PetscInt       n_constraints,n_R,cur_size;
  PetscErrorCode ierr;

  PetscFunctionBegin;
  n_R           = pcis->n - pcbddc->n_vertices;
  n_constraints = pcbddc->local_primal_size - pcbddc->benign_n - pcbddc->n_vertices;
  ierr = VecGetType(pcis->vec1_N,&vtype);CHKERRQ(ierr);

  /* local work vectors (try to avoid unneeded work) */

  /* R nodes */
  cur_size = -1;
  if (pcbddc->vec1_R) {
    ierr = VecGetSize(pcbddc->vec1_R,&cur_size);CHKERRQ(ierr);
  }
  if (cur_size != n_R) {
    ierr = VecDestroy(&pcbddc->vec1_R);CHKERRQ(ierr);
    ierr = VecDestroy(&pcbddc->vec2_R);CHKERRQ(ierr);
    ierr = VecCreate(PetscObjectComm((PetscObject)pcis->vec1_N),&pcbddc->vec1_R);CHKERRQ(ierr);
    ierr = VecSetSizes(pcbddc->vec1_R,PETSC_DECIDE,n_R);CHKERRQ(ierr);
    ierr = VecSetType(pcbddc->vec1_R,vtype);CHKERRQ(ierr);
    ierr = VecDuplicate(pcbddc->vec1_R,&pcbddc->vec2_R);CHKERRQ(ierr);
  }

  /* local primal dofs */
  cur_size = -1;
  if (pcbddc->vec1_P) {
    ierr = VecGetSize(pcbddc->vec1_P,&cur_size);CHKERRQ(ierr);
  }
  if (cur_size != pcbddc->local_primal_size) {
    ierr = VecDestroy(&pcbddc->vec1_P);CHKERRQ(ierr);
    ierr = VecCreate(PetscObjectComm((PetscObject)pcis->vec1_N),&pcbddc->vec1_P);CHKERRQ(ierr);
    ierr = VecSetSizes(pcbddc->vec1_P,PETSC_DECIDE,pcbddc->local_primal_size);CHKERRQ(ierr);
    ierr = VecSetType(pcbddc->vec1_P,vtype);CHKERRQ(ierr);
  }

  /* local explicit constraints */
  cur_size = -1;
  if (pcbddc->vec1_C) {
    ierr = VecGetSize(pcbddc->vec1_C,&cur_size);CHKERRQ(ierr);
  }
  if (n_constraints && cur_size != n_constraints) {
    ierr = VecDestroy(&pcbddc->vec1_C);CHKERRQ(ierr);
    ierr = VecCreate(PetscObjectComm((PetscObject)pcis->vec1_N),&pcbddc->vec1_C);CHKERRQ(ierr);
    ierr = VecSetSizes(pcbddc->vec1_C,PETSC_DECIDE,n_constraints);CHKERRQ(ierr);
    ierr = VecSetType(pcbddc->vec1_C,vtype);CHKERRQ(ierr);
  }
  PetscFunctionReturn(0);
}

349447f4ddc3SStefano Zampini PetscErrorCode PCBDDCSetUpCorrection(PC pc, PetscScalar **coarse_submat_vals_n) 349588ebb749SStefano Zampini { 349625084f0cSStefano Zampini PetscErrorCode ierr; 349725084f0cSStefano Zampini /* pointers to pcis and pcbddc */ 349888ebb749SStefano Zampini PC_IS* pcis = (PC_IS*)pc->data; 349988ebb749SStefano Zampini PC_BDDC* pcbddc
= (PC_BDDC*)pc->data; 3500d62866d3SStefano Zampini PCBDDCSubSchurs sub_schurs = pcbddc->sub_schurs; 350125084f0cSStefano Zampini /* submatrices of local problem */ 350280677318SStefano Zampini Mat A_RV,A_VR,A_VV,local_auxmat2_R; 350306656605SStefano Zampini /* submatrices of local coarse problem */ 350406656605SStefano Zampini Mat S_VV,S_CV,S_VC,S_CC; 350525084f0cSStefano Zampini /* working matrices */ 350606656605SStefano Zampini Mat C_CR; 350725084f0cSStefano Zampini /* additional working stuff */ 350806656605SStefano Zampini PC pc_R; 3509c58f9fdbSStefano Zampini Mat F,Brhs = NULL; 35105cbda25cSStefano Zampini Vec dummy_vec; 3511c58f9fdbSStefano Zampini PetscBool isLU,isCHOL,isILU,need_benign_correction,sparserhs; 351225084f0cSStefano Zampini PetscScalar *coarse_submat_vals; /* TODO: use a PETSc matrix */ 351306656605SStefano Zampini PetscScalar *work; 351406656605SStefano Zampini PetscInt *idx_V_B; 3515ffd830a3SStefano Zampini PetscInt lda_rhs,n,n_vertices,n_constraints,*p0_lidx_I; 351606656605SStefano Zampini PetscInt i,n_R,n_D,n_B; 3517ffd830a3SStefano Zampini 351825084f0cSStefano Zampini /* some shortcuts to scalars */ 351906656605SStefano Zampini PetscScalar one=1.0,m_one=-1.0; 352088ebb749SStefano Zampini 352188ebb749SStefano Zampini PetscFunctionBegin; 35229a962809SStefano Zampini if (!pcbddc->symmetric_primal && pcbddc->benign_n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"Non-symmetric primal basis computation with benign trick not yet implemented"); 3523ffd830a3SStefano Zampini 3524ffd830a3SStefano Zampini /* Set Non-overlapping dimensions */ 3525b371cd4fSStefano Zampini n_vertices = pcbddc->n_vertices; 35264f1b2e48SStefano Zampini n_constraints = pcbddc->local_primal_size - pcbddc->benign_n - n_vertices; 3527b371cd4fSStefano Zampini n_B = pcis->n_B; 3528b371cd4fSStefano Zampini n_D = pcis->n - n_B; 352988ebb749SStefano Zampini n_R = pcis->n - n_vertices; 353088ebb749SStefano Zampini 353188ebb749SStefano Zampini /* vertices in boundary numbering */ 
3532785e854fSJed Brown ierr = PetscMalloc1(n_vertices,&idx_V_B);CHKERRQ(ierr); 35330e6343abSStefano Zampini ierr = ISGlobalToLocalMappingApply(pcis->BtoNmap,IS_GTOLM_DROP,n_vertices,pcbddc->local_primal_ref_node,&i,idx_V_B);CHKERRQ(ierr); 35346c4ed002SBarry Smith if (i != n_vertices) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Error in boundary numbering for BDDC vertices! %D != %D\n",n_vertices,i); 353588ebb749SStefano Zampini 353606656605SStefano Zampini /* Subdomain contribution (Non-overlapping) to coarse matrix */ 3537019a44ceSStefano Zampini ierr = PetscCalloc1(pcbddc->local_primal_size*pcbddc->local_primal_size,&coarse_submat_vals);CHKERRQ(ierr); 353806656605SStefano Zampini ierr = MatCreateSeqDense(PETSC_COMM_SELF,n_vertices,n_vertices,coarse_submat_vals,&S_VV);CHKERRQ(ierr); 353906656605SStefano Zampini ierr = MatSeqDenseSetLDA(S_VV,pcbddc->local_primal_size);CHKERRQ(ierr); 354006656605SStefano Zampini ierr = MatCreateSeqDense(PETSC_COMM_SELF,n_constraints,n_vertices,coarse_submat_vals+n_vertices,&S_CV);CHKERRQ(ierr); 354106656605SStefano Zampini ierr = MatSeqDenseSetLDA(S_CV,pcbddc->local_primal_size);CHKERRQ(ierr); 354206656605SStefano Zampini ierr = MatCreateSeqDense(PETSC_COMM_SELF,n_vertices,n_constraints,coarse_submat_vals+pcbddc->local_primal_size*n_vertices,&S_VC);CHKERRQ(ierr); 354306656605SStefano Zampini ierr = MatSeqDenseSetLDA(S_VC,pcbddc->local_primal_size);CHKERRQ(ierr); 354406656605SStefano Zampini ierr = MatCreateSeqDense(PETSC_COMM_SELF,n_constraints,n_constraints,coarse_submat_vals+(pcbddc->local_primal_size+1)*n_vertices,&S_CC);CHKERRQ(ierr); 354506656605SStefano Zampini ierr = MatSeqDenseSetLDA(S_CC,pcbddc->local_primal_size);CHKERRQ(ierr); 354606656605SStefano Zampini 354706656605SStefano Zampini /* determine if can use MatSolve routines instead of calling KSPSolve on ksp_R */ 354806656605SStefano Zampini ierr = KSPGetPC(pcbddc->ksp_R,&pc_R);CHKERRQ(ierr); 354906656605SStefano Zampini ierr = 
PetscObjectTypeCompare((PetscObject)pc_R,PCLU,&isLU);CHKERRQ(ierr); 355006656605SStefano Zampini ierr = PetscObjectTypeCompare((PetscObject)pc_R,PCILU,&isILU);CHKERRQ(ierr); 355106656605SStefano Zampini ierr = PetscObjectTypeCompare((PetscObject)pc_R,PCCHOLESKY,&isCHOL);CHKERRQ(ierr); 3552ffd830a3SStefano Zampini lda_rhs = n_R; 3553a3df083aSStefano Zampini need_benign_correction = PETSC_FALSE; 355406656605SStefano Zampini if (isLU || isILU || isCHOL) { 355506656605SStefano Zampini ierr = PCFactorGetMatrix(pc_R,&F);CHKERRQ(ierr); 3556b334f244SStefano Zampini } else if (sub_schurs && sub_schurs->reuse_solver) { 3557df4d28bfSStefano Zampini PCBDDCReuseSolvers reuse_solver = sub_schurs->reuse_solver; 3558d62866d3SStefano Zampini MatFactorType type; 3559d62866d3SStefano Zampini 3560df4d28bfSStefano Zampini F = reuse_solver->F; 35616816873aSStefano Zampini ierr = MatGetFactorType(F,&type);CHKERRQ(ierr); 3562d62866d3SStefano Zampini if (type == MAT_FACTOR_CHOLESKY) isCHOL = PETSC_TRUE; 3563ffd830a3SStefano Zampini ierr = MatGetSize(F,&lda_rhs,NULL);CHKERRQ(ierr); 356422db5ddcSStefano Zampini need_benign_correction = (PetscBool)(!!reuse_solver->benign_n); 356506656605SStefano Zampini } else { 356606656605SStefano Zampini F = NULL; 356706656605SStefano Zampini } 356806656605SStefano Zampini 3569c58f9fdbSStefano Zampini /* determine if we can use a sparse right-hand side */ 3570c58f9fdbSStefano Zampini sparserhs = PETSC_FALSE; 3571c58f9fdbSStefano Zampini if (F) { 3572c58f9fdbSStefano Zampini const MatSolverPackage solver; 3573c58f9fdbSStefano Zampini 3574c58f9fdbSStefano Zampini ierr = MatFactorGetSolverPackage(F,&solver);CHKERRQ(ierr); 3575c58f9fdbSStefano Zampini ierr = PetscStrcmp(solver,MATSOLVERMUMPS,&sparserhs);CHKERRQ(ierr); 3576c58f9fdbSStefano Zampini } 3577c58f9fdbSStefano Zampini 3578ffd830a3SStefano Zampini /* allocate workspace */ 3579ffd830a3SStefano Zampini n = 0; 3580ffd830a3SStefano Zampini if (n_constraints) { 3581ffd830a3SStefano Zampini n += 
lda_rhs*n_constraints; 3582ffd830a3SStefano Zampini } 3583ffd830a3SStefano Zampini if (n_vertices) { 3584ffd830a3SStefano Zampini n = PetscMax(2*lda_rhs*n_vertices,n); 3585ffd830a3SStefano Zampini n = PetscMax((lda_rhs+n_B)*n_vertices,n); 3586ffd830a3SStefano Zampini } 35872a3a6641Sstefano_zampini if (!pcbddc->symmetric_primal) { 35882a3a6641Sstefano_zampini n = PetscMax(2*lda_rhs*pcbddc->local_primal_size,n); 35892a3a6641Sstefano_zampini } 3590ffd830a3SStefano Zampini ierr = PetscMalloc1(n,&work);CHKERRQ(ierr); 3591ffd830a3SStefano Zampini 35925cbda25cSStefano Zampini /* create dummy vector to modify rhs and sol of MatMatSolve (work array will never be used) */ 35935cbda25cSStefano Zampini dummy_vec = NULL; 35945cbda25cSStefano Zampini if (need_benign_correction && lda_rhs != n_R && F) { 35955cbda25cSStefano Zampini ierr = VecCreateSeqWithArray(PETSC_COMM_SELF,1,lda_rhs,work,&dummy_vec);CHKERRQ(ierr); 35965cbda25cSStefano Zampini } 35975cbda25cSStefano Zampini 359888ebb749SStefano Zampini /* Precompute stuffs needed for preprocessing and application of BDDC*/ 359988ebb749SStefano Zampini if (n_constraints) { 360072b8c272SStefano Zampini Mat M1,M2,M3,C_B; 360106656605SStefano Zampini IS is_aux; 360280677318SStefano Zampini PetscScalar *array,*array2; 360306656605SStefano Zampini 3604f4ddd8eeSStefano Zampini ierr = MatDestroy(&pcbddc->local_auxmat1);CHKERRQ(ierr); 360580677318SStefano Zampini ierr = MatDestroy(&pcbddc->local_auxmat2);CHKERRQ(ierr); 360688ebb749SStefano Zampini 360725084f0cSStefano Zampini /* Extract constraints on R nodes: C_{CR} */ 360825084f0cSStefano Zampini ierr = ISCreateStride(PETSC_COMM_SELF,n_constraints,n_vertices,1,&is_aux);CHKERRQ(ierr); 36097dae84e0SHong Zhang ierr = MatCreateSubMatrix(pcbddc->ConstraintMatrix,is_aux,pcbddc->is_R_local,MAT_INITIAL_MATRIX,&C_CR);CHKERRQ(ierr); 36107dae84e0SHong Zhang ierr = MatCreateSubMatrix(pcbddc->ConstraintMatrix,is_aux,pcis->is_B_local,MAT_INITIAL_MATRIX,&C_B);CHKERRQ(ierr); 361188ebb749SStefano 
Zampini 361280677318SStefano Zampini /* Assemble local_auxmat2_R = (- A_{RR}^{-1} C^T_{CR}) needed by BDDC setup */ 361380677318SStefano Zampini /* Assemble pcbddc->local_auxmat2 = R_to_B (- A_{RR}^{-1} C^T_{CR}) needed by BDDC application */ 3614c58f9fdbSStefano Zampini if (!sparserhs) { 3615ffd830a3SStefano Zampini ierr = PetscMemzero(work,lda_rhs*n_constraints*sizeof(PetscScalar));CHKERRQ(ierr); 361688ebb749SStefano Zampini for (i=0;i<n_constraints;i++) { 361706656605SStefano Zampini const PetscScalar *row_cmat_values; 361806656605SStefano Zampini const PetscInt *row_cmat_indices; 361906656605SStefano Zampini PetscInt size_of_constraint,j; 362088ebb749SStefano Zampini 362106656605SStefano Zampini ierr = MatGetRow(C_CR,i,&size_of_constraint,&row_cmat_indices,&row_cmat_values);CHKERRQ(ierr); 362206656605SStefano Zampini for (j=0;j<size_of_constraint;j++) { 3623ffd830a3SStefano Zampini work[row_cmat_indices[j]+i*lda_rhs] = -row_cmat_values[j]; 362406656605SStefano Zampini } 362506656605SStefano Zampini ierr = MatRestoreRow(C_CR,i,&size_of_constraint,&row_cmat_indices,&row_cmat_values);CHKERRQ(ierr); 362606656605SStefano Zampini } 3627c58f9fdbSStefano Zampini ierr = MatCreateSeqDense(PETSC_COMM_SELF,lda_rhs,n_constraints,work,&Brhs);CHKERRQ(ierr); 3628c58f9fdbSStefano Zampini } else { 3629c58f9fdbSStefano Zampini Mat tC_CR; 3630c58f9fdbSStefano Zampini 3631c58f9fdbSStefano Zampini ierr = MatScale(C_CR,-1.0);CHKERRQ(ierr); 3632c58f9fdbSStefano Zampini if (lda_rhs != n_R) { 3633c58f9fdbSStefano Zampini PetscScalar *aa; 3634c58f9fdbSStefano Zampini PetscInt r,*ii,*jj; 3635c58f9fdbSStefano Zampini PetscBool done; 3636c58f9fdbSStefano Zampini 3637c58f9fdbSStefano Zampini ierr = MatGetRowIJ(C_CR,0,PETSC_FALSE,PETSC_FALSE,&r,(const PetscInt**)&ii,(const PetscInt**)&jj,&done);CHKERRQ(ierr); 3638c58f9fdbSStefano Zampini if (!done) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"GetRowIJ failed");CHKERRQ(ierr); 3639c58f9fdbSStefano Zampini ierr = 
MatSeqAIJGetArray(C_CR,&aa);CHKERRQ(ierr); 3640c58f9fdbSStefano Zampini ierr = MatCreateSeqAIJWithArrays(PETSC_COMM_SELF,n_constraints,lda_rhs,ii,jj,aa,&tC_CR);CHKERRQ(ierr); 3641c58f9fdbSStefano Zampini ierr = MatRestoreRowIJ(C_CR,0,PETSC_FALSE,PETSC_FALSE,&r,(const PetscInt**)&ii,(const PetscInt**)&jj,&done);CHKERRQ(ierr); 3642c58f9fdbSStefano Zampini if (!done) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"RestoreRowIJ failed");CHKERRQ(ierr); 3643c58f9fdbSStefano Zampini } else { 3644c58f9fdbSStefano Zampini ierr = PetscObjectReference((PetscObject)C_CR);CHKERRQ(ierr); 3645c58f9fdbSStefano Zampini tC_CR = C_CR; 3646c58f9fdbSStefano Zampini } 3647c58f9fdbSStefano Zampini ierr = MatCreateTranspose(tC_CR,&Brhs);CHKERRQ(ierr); 3648c58f9fdbSStefano Zampini ierr = MatDestroy(&tC_CR);CHKERRQ(ierr); 3649c58f9fdbSStefano Zampini } 3650ffd830a3SStefano Zampini ierr = MatCreateSeqDense(PETSC_COMM_SELF,lda_rhs,n_constraints,NULL,&local_auxmat2_R);CHKERRQ(ierr); 365106656605SStefano Zampini if (F) { 3652a3df083aSStefano Zampini if (need_benign_correction) { 3653df4d28bfSStefano Zampini PCBDDCReuseSolvers reuse_solver = sub_schurs->reuse_solver; 3654a3df083aSStefano Zampini 365572b8c272SStefano Zampini /* rhs is already zero on interior dofs, no need to change the rhs */ 365672b8c272SStefano Zampini ierr = PetscMemzero(reuse_solver->benign_save_vals,pcbddc->benign_n*sizeof(PetscScalar));CHKERRQ(ierr); 3657a3df083aSStefano Zampini } 3658c58f9fdbSStefano Zampini ierr = MatMatSolve(F,Brhs,local_auxmat2_R);CHKERRQ(ierr); 3659a3df083aSStefano Zampini if (need_benign_correction) { 3660a3df083aSStefano Zampini PetscScalar *marr; 3661df4d28bfSStefano Zampini PCBDDCReuseSolvers reuse_solver = sub_schurs->reuse_solver; 3662a3df083aSStefano Zampini 3663a3df083aSStefano Zampini ierr = MatDenseGetArray(local_auxmat2_R,&marr);CHKERRQ(ierr); 36645cbda25cSStefano Zampini if (lda_rhs != n_R) { 36655cbda25cSStefano Zampini for (i=0;i<n_constraints;i++) { 36665cbda25cSStefano Zampini ierr = 
VecPlaceArray(dummy_vec,marr+i*lda_rhs);CHKERRQ(ierr); 36675cbda25cSStefano Zampini ierr = PCBDDCReuseSolversBenignAdapt(reuse_solver,dummy_vec,NULL,PETSC_TRUE,PETSC_TRUE);CHKERRQ(ierr); 36685cbda25cSStefano Zampini ierr = VecResetArray(dummy_vec);CHKERRQ(ierr); 36695cbda25cSStefano Zampini } 36705cbda25cSStefano Zampini } else { 3671a3df083aSStefano Zampini for (i=0;i<n_constraints;i++) { 3672a3df083aSStefano Zampini ierr = VecPlaceArray(pcbddc->vec1_R,marr+i*lda_rhs);CHKERRQ(ierr); 36735cbda25cSStefano Zampini ierr = PCBDDCReuseSolversBenignAdapt(reuse_solver,pcbddc->vec1_R,NULL,PETSC_TRUE,PETSC_TRUE);CHKERRQ(ierr); 3674a3df083aSStefano Zampini ierr = VecResetArray(pcbddc->vec1_R);CHKERRQ(ierr); 3675a3df083aSStefano Zampini } 36765cbda25cSStefano Zampini } 3677a3df083aSStefano Zampini ierr = MatDenseRestoreArray(local_auxmat2_R,&marr);CHKERRQ(ierr); 3678a3df083aSStefano Zampini } 367906656605SStefano Zampini } else { 368080677318SStefano Zampini PetscScalar *marr; 368180677318SStefano Zampini 368280677318SStefano Zampini ierr = MatDenseGetArray(local_auxmat2_R,&marr);CHKERRQ(ierr); 368306656605SStefano Zampini for (i=0;i<n_constraints;i++) { 3684ffd830a3SStefano Zampini ierr = VecPlaceArray(pcbddc->vec1_R,work+i*lda_rhs);CHKERRQ(ierr); 3685ffd830a3SStefano Zampini ierr = VecPlaceArray(pcbddc->vec2_R,marr+i*lda_rhs);CHKERRQ(ierr); 368606656605SStefano Zampini ierr = KSPSolve(pcbddc->ksp_R,pcbddc->vec1_R,pcbddc->vec2_R);CHKERRQ(ierr); 368706656605SStefano Zampini ierr = VecResetArray(pcbddc->vec1_R);CHKERRQ(ierr); 368806656605SStefano Zampini ierr = VecResetArray(pcbddc->vec2_R);CHKERRQ(ierr); 368906656605SStefano Zampini } 369080677318SStefano Zampini ierr = MatDenseRestoreArray(local_auxmat2_R,&marr);CHKERRQ(ierr); 369106656605SStefano Zampini } 3692c58f9fdbSStefano Zampini if (sparserhs) { 3693c58f9fdbSStefano Zampini ierr = MatScale(C_CR,-1.0);CHKERRQ(ierr); 3694c58f9fdbSStefano Zampini } 3695c58f9fdbSStefano Zampini ierr = MatDestroy(&Brhs);CHKERRQ(ierr); 
369680677318SStefano Zampini if (!pcbddc->switch_static) { 369780677318SStefano Zampini ierr = MatCreateSeqDense(PETSC_COMM_SELF,n_B,n_constraints,NULL,&pcbddc->local_auxmat2);CHKERRQ(ierr); 369880677318SStefano Zampini ierr = MatDenseGetArray(pcbddc->local_auxmat2,&array);CHKERRQ(ierr); 369980677318SStefano Zampini ierr = MatDenseGetArray(local_auxmat2_R,&array2);CHKERRQ(ierr); 370080677318SStefano Zampini for (i=0;i<n_constraints;i++) { 3701ffd830a3SStefano Zampini ierr = VecPlaceArray(pcbddc->vec1_R,array2+i*lda_rhs);CHKERRQ(ierr); 370280677318SStefano Zampini ierr = VecPlaceArray(pcis->vec1_B,array+i*n_B);CHKERRQ(ierr); 370380677318SStefano Zampini ierr = VecScatterBegin(pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 370480677318SStefano Zampini ierr = VecScatterEnd(pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 370580677318SStefano Zampini ierr = VecResetArray(pcis->vec1_B);CHKERRQ(ierr); 370680677318SStefano Zampini ierr = VecResetArray(pcbddc->vec1_R);CHKERRQ(ierr); 370780677318SStefano Zampini } 370880677318SStefano Zampini ierr = MatDenseRestoreArray(local_auxmat2_R,&array2);CHKERRQ(ierr); 370980677318SStefano Zampini ierr = MatDenseRestoreArray(pcbddc->local_auxmat2,&array);CHKERRQ(ierr); 371072b8c272SStefano Zampini ierr = MatMatMult(C_B,pcbddc->local_auxmat2,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&M3);CHKERRQ(ierr); 371180677318SStefano Zampini } else { 3712ffd830a3SStefano Zampini if (lda_rhs != n_R) { 3713ffd830a3SStefano Zampini IS dummy; 3714ffd830a3SStefano Zampini 3715ffd830a3SStefano Zampini ierr = ISCreateStride(PETSC_COMM_SELF,n_R,0,1,&dummy);CHKERRQ(ierr); 37167dae84e0SHong Zhang ierr = MatCreateSubMatrix(local_auxmat2_R,dummy,NULL,MAT_INITIAL_MATRIX,&pcbddc->local_auxmat2);CHKERRQ(ierr); 3717ffd830a3SStefano Zampini ierr = ISDestroy(&dummy);CHKERRQ(ierr); 3718ffd830a3SStefano Zampini } else { 371980677318SStefano Zampini ierr = 
PetscObjectReference((PetscObject)local_auxmat2_R);CHKERRQ(ierr); 372080677318SStefano Zampini pcbddc->local_auxmat2 = local_auxmat2_R; 3721ffd830a3SStefano Zampini } 372225084f0cSStefano Zampini ierr = MatMatMult(C_CR,pcbddc->local_auxmat2,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&M3);CHKERRQ(ierr); 372380677318SStefano Zampini } 372480677318SStefano Zampini ierr = ISDestroy(&is_aux);CHKERRQ(ierr); 372580677318SStefano Zampini /* Assemble explicitly S_CC = ( C_{CR} A_{RR}^{-1} C^T_{CR} )^{-1} */ 372680677318SStefano Zampini ierr = MatScale(M3,m_one);CHKERRQ(ierr); 372706656605SStefano Zampini ierr = MatDuplicate(M3,MAT_DO_NOT_COPY_VALUES,&M1);CHKERRQ(ierr); 372806656605SStefano Zampini ierr = MatDuplicate(M3,MAT_DO_NOT_COPY_VALUES,&M2);CHKERRQ(ierr); 372980677318SStefano Zampini if (isCHOL) { 373080677318SStefano Zampini ierr = MatCholeskyFactor(M3,NULL,NULL);CHKERRQ(ierr); 373180677318SStefano Zampini } else { 373225084f0cSStefano Zampini ierr = MatLUFactor(M3,NULL,NULL,NULL);CHKERRQ(ierr); 373380677318SStefano Zampini } 373480677318SStefano Zampini ierr = VecSet(pcbddc->vec1_C,one);CHKERRQ(ierr); 373506656605SStefano Zampini ierr = MatDiagonalSet(M2,pcbddc->vec1_C,INSERT_VALUES);CHKERRQ(ierr); 373625084f0cSStefano Zampini ierr = MatMatSolve(M3,M2,M1);CHKERRQ(ierr); 373725084f0cSStefano Zampini ierr = MatDestroy(&M2);CHKERRQ(ierr); 373825084f0cSStefano Zampini ierr = MatDestroy(&M3);CHKERRQ(ierr); 373980677318SStefano Zampini /* Assemble local_auxmat1 = S_CC*C_{CB} needed by BDDC application in KSP and in preproc */ 374072b8c272SStefano Zampini ierr = MatMatMult(M1,C_B,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&pcbddc->local_auxmat1);CHKERRQ(ierr); 374172b8c272SStefano Zampini ierr = MatDestroy(&C_B);CHKERRQ(ierr); 374206656605SStefano Zampini ierr = MatCopy(M1,S_CC,SAME_NONZERO_PATTERN);CHKERRQ(ierr); /* S_CC can have a different LDA, MatMatSolve doesn't support it */ 374306656605SStefano Zampini ierr = MatDestroy(&M1);CHKERRQ(ierr); 3744f4ddd8eeSStefano Zampini } 
3745fc227af8SStefano Zampini 3746fc227af8SStefano Zampini /* Get submatrices from subdomain matrix */ 374788ebb749SStefano Zampini if (n_vertices) { 374806656605SStefano Zampini IS is_aux; 3749c58f9fdbSStefano Zampini PetscBool isseqaij; 37503a50541eSStefano Zampini 3751b334f244SStefano Zampini if (sub_schurs && sub_schurs->reuse_solver) { /* is_R_local is not sorted, ISComplement doesn't like it */ 37526816873aSStefano Zampini IS tis; 37536816873aSStefano Zampini 37546816873aSStefano Zampini ierr = ISDuplicate(pcbddc->is_R_local,&tis);CHKERRQ(ierr); 37556816873aSStefano Zampini ierr = ISSort(tis);CHKERRQ(ierr); 37566816873aSStefano Zampini ierr = ISComplement(tis,0,pcis->n,&is_aux);CHKERRQ(ierr); 37576816873aSStefano Zampini ierr = ISDestroy(&tis);CHKERRQ(ierr); 37586816873aSStefano Zampini } else { 37593a50541eSStefano Zampini ierr = ISComplement(pcbddc->is_R_local,0,pcis->n,&is_aux);CHKERRQ(ierr); 37606816873aSStefano Zampini } 37617dae84e0SHong Zhang ierr = MatCreateSubMatrix(pcbddc->local_mat,pcbddc->is_R_local,is_aux,MAT_INITIAL_MATRIX,&A_RV);CHKERRQ(ierr); 37627dae84e0SHong Zhang ierr = MatCreateSubMatrix(pcbddc->local_mat,is_aux,pcbddc->is_R_local,MAT_INITIAL_MATRIX,&A_VR);CHKERRQ(ierr); 3763c58f9fdbSStefano Zampini ierr = PetscObjectTypeCompare((PetscObject)A_VR,MATSEQAIJ,&isseqaij);CHKERRQ(ierr); 3764c58f9fdbSStefano Zampini if (!isseqaij) { /* MatMatMult(A_VR,A_RRmA_RV) below will raise an error */ 3765c58f9fdbSStefano Zampini ierr = MatConvert(A_VR,MATSEQAIJ,MAT_INPLACE_MATRIX,&A_VR);CHKERRQ(ierr); 3766c58f9fdbSStefano Zampini } 37677dae84e0SHong Zhang ierr = MatCreateSubMatrix(pcbddc->local_mat,is_aux,is_aux,MAT_INITIAL_MATRIX,&A_VV);CHKERRQ(ierr); 376825084f0cSStefano Zampini ierr = ISDestroy(&is_aux);CHKERRQ(ierr); 376988ebb749SStefano Zampini } 377088ebb749SStefano Zampini 377188ebb749SStefano Zampini /* Matrix of coarse basis functions (local) */ 3772f4ddd8eeSStefano Zampini if (pcbddc->coarse_phi_B) { 377306656605SStefano Zampini PetscInt 
on_B,on_primal,on_D=n_D; 377406656605SStefano Zampini if (pcbddc->coarse_phi_D) { 377506656605SStefano Zampini ierr = MatGetSize(pcbddc->coarse_phi_D,&on_D,NULL);CHKERRQ(ierr); 377606656605SStefano Zampini } 3777f4ddd8eeSStefano Zampini ierr = MatGetSize(pcbddc->coarse_phi_B,&on_B,&on_primal);CHKERRQ(ierr); 377806656605SStefano Zampini if (on_B != n_B || on_primal != pcbddc->local_primal_size || on_D != n_D) { 377906656605SStefano Zampini PetscScalar *marray; 378006656605SStefano Zampini 378106656605SStefano Zampini ierr = MatDenseGetArray(pcbddc->coarse_phi_B,&marray);CHKERRQ(ierr); 378206656605SStefano Zampini ierr = PetscFree(marray);CHKERRQ(ierr); 3783f4ddd8eeSStefano Zampini ierr = MatDestroy(&pcbddc->coarse_phi_B);CHKERRQ(ierr); 3784f4ddd8eeSStefano Zampini ierr = MatDestroy(&pcbddc->coarse_psi_B);CHKERRQ(ierr); 3785f4ddd8eeSStefano Zampini ierr = MatDestroy(&pcbddc->coarse_phi_D);CHKERRQ(ierr); 3786f4ddd8eeSStefano Zampini ierr = MatDestroy(&pcbddc->coarse_psi_D);CHKERRQ(ierr); 3787f4ddd8eeSStefano Zampini } 3788f4ddd8eeSStefano Zampini } 378906656605SStefano Zampini 3790f4ddd8eeSStefano Zampini if (!pcbddc->coarse_phi_B) { 3791a6e023c1Sstefano_zampini PetscScalar *marr; 379288ebb749SStefano Zampini 3793a6e023c1Sstefano_zampini /* memory size */ 379406656605SStefano Zampini n = n_B*pcbddc->local_primal_size; 3795a6e023c1Sstefano_zampini if (pcbddc->switch_static || pcbddc->dbg_flag) n += n_D*pcbddc->local_primal_size; 3796a6e023c1Sstefano_zampini if (!pcbddc->symmetric_primal) n *= 2; 3797a6e023c1Sstefano_zampini ierr = PetscCalloc1(n,&marr);CHKERRQ(ierr); 3798a6e023c1Sstefano_zampini ierr = MatCreateSeqDense(PETSC_COMM_SELF,n_B,pcbddc->local_primal_size,marr,&pcbddc->coarse_phi_B);CHKERRQ(ierr); 3799a6e023c1Sstefano_zampini marr += n_B*pcbddc->local_primal_size; 38008eeda7d8SStefano Zampini if (pcbddc->switch_static || pcbddc->dbg_flag) { 3801a6e023c1Sstefano_zampini ierr = 
MatCreateSeqDense(PETSC_COMM_SELF,n_D,pcbddc->local_primal_size,marr,&pcbddc->coarse_phi_D);CHKERRQ(ierr); 3802a6e023c1Sstefano_zampini marr += n_D*pcbddc->local_primal_size; 380388ebb749SStefano Zampini } 38043301b35fSStefano Zampini if (!pcbddc->symmetric_primal) { 3805a6e023c1Sstefano_zampini ierr = MatCreateSeqDense(PETSC_COMM_SELF,n_B,pcbddc->local_primal_size,marr,&pcbddc->coarse_psi_B);CHKERRQ(ierr); 3806a6e023c1Sstefano_zampini marr += n_B*pcbddc->local_primal_size; 38078eeda7d8SStefano Zampini if (pcbddc->switch_static || pcbddc->dbg_flag) { 3808a6e023c1Sstefano_zampini ierr = MatCreateSeqDense(PETSC_COMM_SELF,n_D,pcbddc->local_primal_size,marr,&pcbddc->coarse_psi_D);CHKERRQ(ierr); 380988ebb749SStefano Zampini } 381088ebb749SStefano Zampini } else { 3811c0553b1fSStefano Zampini ierr = PetscObjectReference((PetscObject)pcbddc->coarse_phi_B);CHKERRQ(ierr); 3812c0553b1fSStefano Zampini pcbddc->coarse_psi_B = pcbddc->coarse_phi_B; 38131b968477SStefano Zampini if (pcbddc->switch_static || pcbddc->dbg_flag) { 3814c0553b1fSStefano Zampini ierr = PetscObjectReference((PetscObject)pcbddc->coarse_phi_D);CHKERRQ(ierr); 3815c0553b1fSStefano Zampini pcbddc->coarse_psi_D = pcbddc->coarse_phi_D; 3816c0553b1fSStefano Zampini } 381788ebb749SStefano Zampini } 381806656605SStefano Zampini } 3819019a44ceSStefano Zampini 382006656605SStefano Zampini /* We are now ready to evaluate coarse basis functions and subdomain contribution to coarse problem */ 38214f1b2e48SStefano Zampini p0_lidx_I = NULL; 38224f1b2e48SStefano Zampini if (pcbddc->benign_n && (pcbddc->switch_static || pcbddc->dbg_flag)) { 3823d12edf2fSStefano Zampini const PetscInt *idxs; 3824d12edf2fSStefano Zampini 3825d12edf2fSStefano Zampini ierr = ISGetIndices(pcis->is_I_local,&idxs);CHKERRQ(ierr); 38264f1b2e48SStefano Zampini ierr = PetscMalloc1(pcbddc->benign_n,&p0_lidx_I);CHKERRQ(ierr); 38274f1b2e48SStefano Zampini for (i=0;i<pcbddc->benign_n;i++) { 38284f1b2e48SStefano Zampini ierr = 
PetscFindInt(pcbddc->benign_p0_lidx[i],pcis->n-pcis->n_B,idxs,&p0_lidx_I[i]);CHKERRQ(ierr); 38294f1b2e48SStefano Zampini } 3830d12edf2fSStefano Zampini ierr = ISRestoreIndices(pcis->is_I_local,&idxs);CHKERRQ(ierr); 3831d12edf2fSStefano Zampini } 3832d16cbb6bSStefano Zampini 383306656605SStefano Zampini /* vertices */ 383406656605SStefano Zampini if (n_vertices) { 3835c58f9fdbSStefano Zampini PetscBool restoreavr = PETSC_FALSE; 383616f15bc4SStefano Zampini 3837af25d912SStefano Zampini ierr = MatConvert(A_VV,MATDENSE,MAT_INPLACE_MATRIX,&A_VV);CHKERRQ(ierr); 383804708bb6SStefano Zampini 383916f15bc4SStefano Zampini if (n_R) { 384014393ed6SStefano Zampini Mat A_RRmA_RV,A_RV_bcorr=NULL,S_VVt; /* S_VVt with LDA=N */ 384106656605SStefano Zampini PetscBLASInt B_N,B_one = 1; 384216f15bc4SStefano Zampini PetscScalar *x,*y; 384306656605SStefano Zampini 384421eccb56SStefano Zampini ierr = MatScale(A_RV,m_one);CHKERRQ(ierr); 384514393ed6SStefano Zampini if (need_benign_correction) { 384614393ed6SStefano Zampini ISLocalToGlobalMapping RtoN; 384714393ed6SStefano Zampini IS is_p0; 384814393ed6SStefano Zampini PetscInt *idxs_p0,n; 384914393ed6SStefano Zampini 385014393ed6SStefano Zampini ierr = PetscMalloc1(pcbddc->benign_n,&idxs_p0);CHKERRQ(ierr); 385114393ed6SStefano Zampini ierr = ISLocalToGlobalMappingCreateIS(pcbddc->is_R_local,&RtoN);CHKERRQ(ierr); 385214393ed6SStefano Zampini ierr = ISGlobalToLocalMappingApply(RtoN,IS_GTOLM_DROP,pcbddc->benign_n,pcbddc->benign_p0_lidx,&n,idxs_p0);CHKERRQ(ierr); 3853af25d912SStefano Zampini if (n != pcbddc->benign_n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Error in R numbering for benign p0! 
%d != %d\n",n,pcbddc->benign_n); 385414393ed6SStefano Zampini ierr = ISLocalToGlobalMappingDestroy(&RtoN);CHKERRQ(ierr); 385514393ed6SStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,n,idxs_p0,PETSC_OWN_POINTER,&is_p0);CHKERRQ(ierr); 38567dae84e0SHong Zhang ierr = MatCreateSubMatrix(A_RV,is_p0,NULL,MAT_INITIAL_MATRIX,&A_RV_bcorr);CHKERRQ(ierr); 385714393ed6SStefano Zampini ierr = ISDestroy(&is_p0);CHKERRQ(ierr); 385814393ed6SStefano Zampini } 385914393ed6SStefano Zampini 3860c58f9fdbSStefano Zampini ierr = MatCreateSeqDense(PETSC_COMM_SELF,lda_rhs,n_vertices,work,&A_RRmA_RV);CHKERRQ(ierr); 3861c58f9fdbSStefano Zampini if (!sparserhs || need_benign_correction) { 3862ffd830a3SStefano Zampini if (lda_rhs == n_R) { 3863af25d912SStefano Zampini ierr = MatConvert(A_RV,MATDENSE,MAT_INPLACE_MATRIX,&A_RV);CHKERRQ(ierr); 3864ffd830a3SStefano Zampini } else { 3865ca92afb2SStefano Zampini PetscScalar *av,*array; 3866ca92afb2SStefano Zampini const PetscInt *xadj,*adjncy; 3867ca92afb2SStefano Zampini PetscInt n; 3868ca92afb2SStefano Zampini PetscBool flg_row; 3869ffd830a3SStefano Zampini 3870ca92afb2SStefano Zampini array = work+lda_rhs*n_vertices; 3871ca92afb2SStefano Zampini ierr = PetscMemzero(array,lda_rhs*n_vertices*sizeof(PetscScalar));CHKERRQ(ierr); 38729d54b7f4SStefano Zampini ierr = MatConvert(A_RV,MATSEQAIJ,MAT_INPLACE_MATRIX,&A_RV);CHKERRQ(ierr); 3873ca92afb2SStefano Zampini ierr = MatGetRowIJ(A_RV,0,PETSC_FALSE,PETSC_FALSE,&n,&xadj,&adjncy,&flg_row);CHKERRQ(ierr); 3874ca92afb2SStefano Zampini ierr = MatSeqAIJGetArray(A_RV,&av);CHKERRQ(ierr); 3875ca92afb2SStefano Zampini for (i=0;i<n;i++) { 3876ca92afb2SStefano Zampini PetscInt j; 3877ca92afb2SStefano Zampini for (j=xadj[i];j<xadj[i+1];j++) array[lda_rhs*adjncy[j]+i] = av[j]; 3878ffd830a3SStefano Zampini } 3879ca92afb2SStefano Zampini ierr = MatRestoreRowIJ(A_RV,0,PETSC_FALSE,PETSC_FALSE,&n,&xadj,&adjncy,&flg_row);CHKERRQ(ierr); 3880ca92afb2SStefano Zampini ierr = MatDestroy(&A_RV);CHKERRQ(ierr); 
3881ca92afb2SStefano Zampini ierr = MatCreateSeqDense(PETSC_COMM_SELF,lda_rhs,n_vertices,array,&A_RV);CHKERRQ(ierr); 3882ffd830a3SStefano Zampini } 3883a3df083aSStefano Zampini if (need_benign_correction) { 3884df4d28bfSStefano Zampini PCBDDCReuseSolvers reuse_solver = sub_schurs->reuse_solver; 3885a3df083aSStefano Zampini PetscScalar *marr; 3886a3df083aSStefano Zampini 3887a3df083aSStefano Zampini ierr = MatDenseGetArray(A_RV,&marr);CHKERRQ(ierr); 388814393ed6SStefano Zampini /* need \Phi^T A_RV = (I+L)A_RV, L given by 388914393ed6SStefano Zampini 389014393ed6SStefano Zampini | 0 0 0 | (V) 389114393ed6SStefano Zampini L = | 0 0 -1 | (P-p0) 389214393ed6SStefano Zampini | 0 0 -1 | (p0) 389314393ed6SStefano Zampini 389414393ed6SStefano Zampini */ 3895df4d28bfSStefano Zampini for (i=0;i<reuse_solver->benign_n;i++) { 389614393ed6SStefano Zampini const PetscScalar *vals; 389714393ed6SStefano Zampini const PetscInt *idxs,*idxs_zero; 389814393ed6SStefano Zampini PetscInt n,j,nz; 389914393ed6SStefano Zampini 3900df4d28bfSStefano Zampini ierr = ISGetLocalSize(reuse_solver->benign_zerodiag_subs[i],&nz);CHKERRQ(ierr); 3901df4d28bfSStefano Zampini ierr = ISGetIndices(reuse_solver->benign_zerodiag_subs[i],&idxs_zero);CHKERRQ(ierr); 390214393ed6SStefano Zampini ierr = MatGetRow(A_RV_bcorr,i,&n,&idxs,&vals);CHKERRQ(ierr); 390314393ed6SStefano Zampini for (j=0;j<n;j++) { 390414393ed6SStefano Zampini PetscScalar val = vals[j]; 390514393ed6SStefano Zampini PetscInt k,col = idxs[j]; 390614393ed6SStefano Zampini for (k=0;k<nz;k++) marr[idxs_zero[k]+lda_rhs*col] -= val; 390714393ed6SStefano Zampini } 390814393ed6SStefano Zampini ierr = MatRestoreRow(A_RV_bcorr,i,&n,&idxs,&vals);CHKERRQ(ierr); 3909df4d28bfSStefano Zampini ierr = ISRestoreIndices(reuse_solver->benign_zerodiag_subs[i],&idxs_zero);CHKERRQ(ierr); 391014393ed6SStefano Zampini } 391172b8c272SStefano Zampini ierr = MatDenseRestoreArray(A_RV,&marr);CHKERRQ(ierr); 391272b8c272SStefano Zampini } 3913c58f9fdbSStefano Zampini ierr 
= PetscObjectReference((PetscObject)A_RV);CHKERRQ(ierr); 3914c58f9fdbSStefano Zampini Brhs = A_RV; 3915c58f9fdbSStefano Zampini } else { 3916c58f9fdbSStefano Zampini Mat tA_RVT,A_RVT; 3917c58f9fdbSStefano Zampini 3918c58f9fdbSStefano Zampini if (!pcbddc->symmetric_primal) { 3919c58f9fdbSStefano Zampini ierr = MatTranspose(A_RV,MAT_INITIAL_MATRIX,&A_RVT);CHKERRQ(ierr); 3920c58f9fdbSStefano Zampini } else { 3921c58f9fdbSStefano Zampini restoreavr = PETSC_TRUE; 3922c58f9fdbSStefano Zampini ierr = MatScale(A_VR,-1.0);CHKERRQ(ierr); 3923c58f9fdbSStefano Zampini ierr = PetscObjectReference((PetscObject)A_VR);CHKERRQ(ierr); 3924c58f9fdbSStefano Zampini A_RVT = A_VR; 3925c58f9fdbSStefano Zampini } 3926c58f9fdbSStefano Zampini if (lda_rhs != n_R) { 3927c58f9fdbSStefano Zampini PetscScalar *aa; 3928c58f9fdbSStefano Zampini PetscInt r,*ii,*jj; 3929c58f9fdbSStefano Zampini PetscBool done; 3930c58f9fdbSStefano Zampini 3931c58f9fdbSStefano Zampini ierr = MatGetRowIJ(A_RVT,0,PETSC_FALSE,PETSC_FALSE,&r,(const PetscInt**)&ii,(const PetscInt**)&jj,&done);CHKERRQ(ierr); 3932c58f9fdbSStefano Zampini if (!done) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"GetRowIJ failed");CHKERRQ(ierr); 3933c58f9fdbSStefano Zampini ierr = MatSeqAIJGetArray(A_RVT,&aa);CHKERRQ(ierr); 3934c58f9fdbSStefano Zampini ierr = MatCreateSeqAIJWithArrays(PETSC_COMM_SELF,n_vertices,lda_rhs,ii,jj,aa,&tA_RVT);CHKERRQ(ierr); 3935c58f9fdbSStefano Zampini ierr = MatRestoreRowIJ(A_RVT,0,PETSC_FALSE,PETSC_FALSE,&r,(const PetscInt**)&ii,(const PetscInt**)&jj,&done);CHKERRQ(ierr); 3936c58f9fdbSStefano Zampini if (!done) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"RestoreRowIJ failed");CHKERRQ(ierr); 3937c58f9fdbSStefano Zampini } else { 3938c58f9fdbSStefano Zampini ierr = PetscObjectReference((PetscObject)A_RVT);CHKERRQ(ierr); 3939c58f9fdbSStefano Zampini tA_RVT = A_RVT; 3940c58f9fdbSStefano Zampini } 3941c58f9fdbSStefano Zampini ierr = MatCreateTranspose(tA_RVT,&Brhs);CHKERRQ(ierr); 3942c58f9fdbSStefano Zampini ierr = 
MatDestroy(&tA_RVT);CHKERRQ(ierr); 3943c58f9fdbSStefano Zampini ierr = MatDestroy(&A_RVT);CHKERRQ(ierr); 3944c58f9fdbSStefano Zampini } 394572b8c272SStefano Zampini if (F) { 394614393ed6SStefano Zampini /* need to correct the rhs */ 394772b8c272SStefano Zampini if (need_benign_correction) { 394872b8c272SStefano Zampini PCBDDCReuseSolvers reuse_solver = sub_schurs->reuse_solver; 394972b8c272SStefano Zampini PetscScalar *marr; 395072b8c272SStefano Zampini 3951c58f9fdbSStefano Zampini ierr = MatDenseGetArray(Brhs,&marr);CHKERRQ(ierr); 39525cbda25cSStefano Zampini if (lda_rhs != n_R) { 39535cbda25cSStefano Zampini for (i=0;i<n_vertices;i++) { 39545cbda25cSStefano Zampini ierr = VecPlaceArray(dummy_vec,marr+i*lda_rhs);CHKERRQ(ierr); 39555cbda25cSStefano Zampini ierr = PCBDDCReuseSolversBenignAdapt(reuse_solver,dummy_vec,NULL,PETSC_FALSE,PETSC_TRUE);CHKERRQ(ierr); 39565cbda25cSStefano Zampini ierr = VecResetArray(dummy_vec);CHKERRQ(ierr); 39575cbda25cSStefano Zampini } 39585cbda25cSStefano Zampini } else { 3959a3df083aSStefano Zampini for (i=0;i<n_vertices;i++) { 3960a3df083aSStefano Zampini ierr = VecPlaceArray(pcbddc->vec1_R,marr+i*lda_rhs);CHKERRQ(ierr); 39615cbda25cSStefano Zampini ierr = PCBDDCReuseSolversBenignAdapt(reuse_solver,pcbddc->vec1_R,NULL,PETSC_FALSE,PETSC_TRUE);CHKERRQ(ierr); 3962a3df083aSStefano Zampini ierr = VecResetArray(pcbddc->vec1_R);CHKERRQ(ierr); 3963a3df083aSStefano Zampini } 39645cbda25cSStefano Zampini } 3965c58f9fdbSStefano Zampini ierr = MatDenseRestoreArray(Brhs,&marr);CHKERRQ(ierr); 3966a3df083aSStefano Zampini } 3967c58f9fdbSStefano Zampini ierr = MatMatSolve(F,Brhs,A_RRmA_RV);CHKERRQ(ierr); 3968c58f9fdbSStefano Zampini if (restoreavr) { 3969c58f9fdbSStefano Zampini ierr = MatScale(A_VR,-1.0);CHKERRQ(ierr); 3970c58f9fdbSStefano Zampini } 397114393ed6SStefano Zampini /* need to correct the solution */ 3972a3df083aSStefano Zampini if (need_benign_correction) { 3973df4d28bfSStefano Zampini PCBDDCReuseSolvers reuse_solver = 
sub_schurs->reuse_solver; 3974a3df083aSStefano Zampini PetscScalar *marr; 3975a3df083aSStefano Zampini 3976a3df083aSStefano Zampini ierr = MatDenseGetArray(A_RRmA_RV,&marr);CHKERRQ(ierr); 39775cbda25cSStefano Zampini if (lda_rhs != n_R) { 39785cbda25cSStefano Zampini for (i=0;i<n_vertices;i++) { 39795cbda25cSStefano Zampini ierr = VecPlaceArray(dummy_vec,marr+i*lda_rhs);CHKERRQ(ierr); 39805cbda25cSStefano Zampini ierr = PCBDDCReuseSolversBenignAdapt(reuse_solver,dummy_vec,NULL,PETSC_TRUE,PETSC_TRUE);CHKERRQ(ierr); 39815cbda25cSStefano Zampini ierr = VecResetArray(dummy_vec);CHKERRQ(ierr); 39825cbda25cSStefano Zampini } 39835cbda25cSStefano Zampini } else { 3984a3df083aSStefano Zampini for (i=0;i<n_vertices;i++) { 3985a3df083aSStefano Zampini ierr = VecPlaceArray(pcbddc->vec1_R,marr+i*lda_rhs);CHKERRQ(ierr); 39865cbda25cSStefano Zampini ierr = PCBDDCReuseSolversBenignAdapt(reuse_solver,pcbddc->vec1_R,NULL,PETSC_TRUE,PETSC_TRUE);CHKERRQ(ierr); 3987a3df083aSStefano Zampini ierr = VecResetArray(pcbddc->vec1_R);CHKERRQ(ierr); 3988a3df083aSStefano Zampini } 39895cbda25cSStefano Zampini } 3990a3df083aSStefano Zampini ierr = MatDenseRestoreArray(A_RRmA_RV,&marr);CHKERRQ(ierr); 3991a3df083aSStefano Zampini } 399206656605SStefano Zampini } else { 3993c58f9fdbSStefano Zampini ierr = MatDenseGetArray(Brhs,&y);CHKERRQ(ierr); 399406656605SStefano Zampini for (i=0;i<n_vertices;i++) { 3995ffd830a3SStefano Zampini ierr = VecPlaceArray(pcbddc->vec1_R,y+i*lda_rhs);CHKERRQ(ierr); 3996ffd830a3SStefano Zampini ierr = VecPlaceArray(pcbddc->vec2_R,work+i*lda_rhs);CHKERRQ(ierr); 399706656605SStefano Zampini ierr = KSPSolve(pcbddc->ksp_R,pcbddc->vec1_R,pcbddc->vec2_R);CHKERRQ(ierr); 399806656605SStefano Zampini ierr = VecResetArray(pcbddc->vec1_R);CHKERRQ(ierr); 399906656605SStefano Zampini ierr = VecResetArray(pcbddc->vec2_R);CHKERRQ(ierr); 400006656605SStefano Zampini } 4001c58f9fdbSStefano Zampini ierr = MatDenseRestoreArray(Brhs,&y);CHKERRQ(ierr); 400206656605SStefano Zampini } 
400380677318SStefano Zampini ierr = MatDestroy(&A_RV);CHKERRQ(ierr); 4004c58f9fdbSStefano Zampini ierr = MatDestroy(&Brhs);CHKERRQ(ierr); 4005ffd830a3SStefano Zampini /* S_VV and S_CV */ 400606656605SStefano Zampini if (n_constraints) { 400706656605SStefano Zampini Mat B; 400880677318SStefano Zampini 4009ffd830a3SStefano Zampini ierr = PetscMemzero(work+lda_rhs*n_vertices,n_B*n_vertices*sizeof(PetscScalar));CHKERRQ(ierr); 401080677318SStefano Zampini for (i=0;i<n_vertices;i++) { 4011ffd830a3SStefano Zampini ierr = VecPlaceArray(pcbddc->vec1_R,work+i*lda_rhs);CHKERRQ(ierr); 4012ffd830a3SStefano Zampini ierr = VecPlaceArray(pcis->vec1_B,work+lda_rhs*n_vertices+i*n_B);CHKERRQ(ierr); 401380677318SStefano Zampini ierr = VecScatterBegin(pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 401480677318SStefano Zampini ierr = VecScatterEnd(pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 401580677318SStefano Zampini ierr = VecResetArray(pcis->vec1_B);CHKERRQ(ierr); 401680677318SStefano Zampini ierr = VecResetArray(pcbddc->vec1_R);CHKERRQ(ierr); 401780677318SStefano Zampini } 4018ffd830a3SStefano Zampini ierr = MatCreateSeqDense(PETSC_COMM_SELF,n_B,n_vertices,work+lda_rhs*n_vertices,&B);CHKERRQ(ierr); 401980677318SStefano Zampini ierr = MatMatMult(pcbddc->local_auxmat1,B,MAT_REUSE_MATRIX,PETSC_DEFAULT,&S_CV);CHKERRQ(ierr); 402080677318SStefano Zampini ierr = MatDestroy(&B);CHKERRQ(ierr); 4021ffd830a3SStefano Zampini ierr = MatCreateSeqDense(PETSC_COMM_SELF,lda_rhs,n_vertices,work+lda_rhs*n_vertices,&B);CHKERRQ(ierr); 402280677318SStefano Zampini ierr = MatMatMult(local_auxmat2_R,S_CV,MAT_REUSE_MATRIX,PETSC_DEFAULT,&B);CHKERRQ(ierr); 402306656605SStefano Zampini ierr = MatScale(S_CV,m_one);CHKERRQ(ierr); 4024ffd830a3SStefano Zampini ierr = PetscBLASIntCast(lda_rhs*n_vertices,&B_N);CHKERRQ(ierr); 4025ffd830a3SStefano Zampini 
PetscStackCallBLAS("BLASaxpy",BLASaxpy_(&B_N,&one,work+lda_rhs*n_vertices,&B_one,work,&B_one)); 402606656605SStefano Zampini ierr = MatDestroy(&B);CHKERRQ(ierr); 402706656605SStefano Zampini } 4028ffd830a3SStefano Zampini if (lda_rhs != n_R) { 4029ffd830a3SStefano Zampini ierr = MatDestroy(&A_RRmA_RV);CHKERRQ(ierr); 4030ffd830a3SStefano Zampini ierr = MatCreateSeqDense(PETSC_COMM_SELF,n_R,n_vertices,work,&A_RRmA_RV);CHKERRQ(ierr); 4031ffd830a3SStefano Zampini ierr = MatSeqDenseSetLDA(A_RRmA_RV,lda_rhs);CHKERRQ(ierr); 4032ffd830a3SStefano Zampini } 403306656605SStefano Zampini ierr = MatMatMult(A_VR,A_RRmA_RV,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&S_VVt);CHKERRQ(ierr); 403414393ed6SStefano Zampini /* need A_VR * \Phi * A_RRmA_RV = A_VR * (I+L)^T * A_RRmA_RV, L given as before */ 403514393ed6SStefano Zampini if (need_benign_correction) { 4036df4d28bfSStefano Zampini PCBDDCReuseSolvers reuse_solver = sub_schurs->reuse_solver; 403714393ed6SStefano Zampini PetscScalar *marr,*sums; 403814393ed6SStefano Zampini 403914393ed6SStefano Zampini ierr = PetscMalloc1(n_vertices,&sums);CHKERRQ(ierr); 4040f913dca9SStefano Zampini ierr = MatDenseGetArray(S_VVt,&marr);CHKERRQ(ierr); 4041df4d28bfSStefano Zampini for (i=0;i<reuse_solver->benign_n;i++) { 404214393ed6SStefano Zampini const PetscScalar *vals; 404314393ed6SStefano Zampini const PetscInt *idxs,*idxs_zero; 404414393ed6SStefano Zampini PetscInt n,j,nz; 404514393ed6SStefano Zampini 4046df4d28bfSStefano Zampini ierr = ISGetLocalSize(reuse_solver->benign_zerodiag_subs[i],&nz);CHKERRQ(ierr); 4047df4d28bfSStefano Zampini ierr = ISGetIndices(reuse_solver->benign_zerodiag_subs[i],&idxs_zero);CHKERRQ(ierr); 404814393ed6SStefano Zampini for (j=0;j<n_vertices;j++) { 404914393ed6SStefano Zampini PetscInt k; 405014393ed6SStefano Zampini sums[j] = 0.; 405114393ed6SStefano Zampini for (k=0;k<nz;k++) sums[j] += work[idxs_zero[k]+j*lda_rhs]; 405214393ed6SStefano Zampini } 405314393ed6SStefano Zampini ierr = 
MatGetRow(A_RV_bcorr,i,&n,&idxs,&vals);CHKERRQ(ierr); 405414393ed6SStefano Zampini for (j=0;j<n;j++) { 405514393ed6SStefano Zampini PetscScalar val = vals[j]; 405614393ed6SStefano Zampini PetscInt k; 405714393ed6SStefano Zampini for (k=0;k<n_vertices;k++) { 405814393ed6SStefano Zampini marr[idxs[j]+k*n_vertices] += val*sums[k]; 405914393ed6SStefano Zampini } 406014393ed6SStefano Zampini } 406114393ed6SStefano Zampini ierr = MatRestoreRow(A_RV_bcorr,i,&n,&idxs,&vals);CHKERRQ(ierr); 4062df4d28bfSStefano Zampini ierr = ISRestoreIndices(reuse_solver->benign_zerodiag_subs[i],&idxs_zero);CHKERRQ(ierr); 406314393ed6SStefano Zampini } 406414393ed6SStefano Zampini ierr = PetscFree(sums);CHKERRQ(ierr); 4065f913dca9SStefano Zampini ierr = MatDenseRestoreArray(S_VVt,&marr);CHKERRQ(ierr); 406614393ed6SStefano Zampini ierr = MatDestroy(&A_RV_bcorr);CHKERRQ(ierr); 406714393ed6SStefano Zampini } 406880677318SStefano Zampini ierr = MatDestroy(&A_RRmA_RV);CHKERRQ(ierr); 406906656605SStefano Zampini ierr = PetscBLASIntCast(n_vertices*n_vertices,&B_N);CHKERRQ(ierr); 407006656605SStefano Zampini ierr = MatDenseGetArray(A_VV,&x);CHKERRQ(ierr); 407106656605SStefano Zampini ierr = MatDenseGetArray(S_VVt,&y);CHKERRQ(ierr); 407206656605SStefano Zampini PetscStackCallBLAS("BLASaxpy",BLASaxpy_(&B_N,&one,x,&B_one,y,&B_one)); 407306656605SStefano Zampini ierr = MatDenseRestoreArray(A_VV,&x);CHKERRQ(ierr); 407406656605SStefano Zampini ierr = MatDenseRestoreArray(S_VVt,&y);CHKERRQ(ierr); 407506656605SStefano Zampini ierr = MatCopy(S_VVt,S_VV,SAME_NONZERO_PATTERN);CHKERRQ(ierr); 4076d16cbb6bSStefano Zampini ierr = MatDestroy(&S_VVt);CHKERRQ(ierr); 4077019a44ceSStefano Zampini } else { 4078d16cbb6bSStefano Zampini ierr = MatCopy(A_VV,S_VV,SAME_NONZERO_PATTERN);CHKERRQ(ierr); 4079d16cbb6bSStefano Zampini } 408021eccb56SStefano Zampini ierr = MatDestroy(&A_VV);CHKERRQ(ierr); 4081d16cbb6bSStefano Zampini 408206656605SStefano Zampini /* coarse basis functions */ 408306656605SStefano Zampini for 
(i=0;i<n_vertices;i++) { 408416f15bc4SStefano Zampini PetscScalar *y; 408516f15bc4SStefano Zampini 4086ffd830a3SStefano Zampini ierr = VecPlaceArray(pcbddc->vec1_R,work+lda_rhs*i);CHKERRQ(ierr); 408706656605SStefano Zampini ierr = MatDenseGetArray(pcbddc->coarse_phi_B,&y);CHKERRQ(ierr); 408806656605SStefano Zampini ierr = VecPlaceArray(pcis->vec1_B,y+n_B*i);CHKERRQ(ierr); 408906656605SStefano Zampini ierr = VecScatterBegin(pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 409006656605SStefano Zampini ierr = VecScatterEnd(pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 409106656605SStefano Zampini y[n_B*i+idx_V_B[i]] = 1.0; 409206656605SStefano Zampini ierr = MatDenseRestoreArray(pcbddc->coarse_phi_B,&y);CHKERRQ(ierr); 409306656605SStefano Zampini ierr = VecResetArray(pcis->vec1_B);CHKERRQ(ierr); 409406656605SStefano Zampini 409506656605SStefano Zampini if (pcbddc->switch_static || pcbddc->dbg_flag) { 40964f1b2e48SStefano Zampini PetscInt j; 40974f1b2e48SStefano Zampini 409806656605SStefano Zampini ierr = MatDenseGetArray(pcbddc->coarse_phi_D,&y);CHKERRQ(ierr); 409906656605SStefano Zampini ierr = VecPlaceArray(pcis->vec1_D,y+n_D*i);CHKERRQ(ierr); 410006656605SStefano Zampini ierr = VecScatterBegin(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 410106656605SStefano Zampini ierr = VecScatterEnd(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 410206656605SStefano Zampini ierr = VecResetArray(pcis->vec1_D);CHKERRQ(ierr); 41034f1b2e48SStefano Zampini for (j=0;j<pcbddc->benign_n;j++) y[n_D*i+p0_lidx_I[j]] = 0.0; 410406656605SStefano Zampini ierr = MatDenseRestoreArray(pcbddc->coarse_phi_D,&y);CHKERRQ(ierr); 410506656605SStefano Zampini } 410606656605SStefano Zampini ierr = VecResetArray(pcbddc->vec1_R);CHKERRQ(ierr); 410706656605SStefano Zampini } 410804708bb6SStefano Zampini /* if n_R == 0 the object is not 
destroyed */ 410904708bb6SStefano Zampini ierr = MatDestroy(&A_RV);CHKERRQ(ierr); 411006656605SStefano Zampini } 41115cbda25cSStefano Zampini ierr = VecDestroy(&dummy_vec);CHKERRQ(ierr); 411206656605SStefano Zampini 411306656605SStefano Zampini if (n_constraints) { 411406656605SStefano Zampini Mat B; 411506656605SStefano Zampini 4116ffd830a3SStefano Zampini ierr = MatCreateSeqDense(PETSC_COMM_SELF,lda_rhs,n_constraints,work,&B);CHKERRQ(ierr); 411706656605SStefano Zampini ierr = MatScale(S_CC,m_one);CHKERRQ(ierr); 411880677318SStefano Zampini ierr = MatMatMult(local_auxmat2_R,S_CC,MAT_REUSE_MATRIX,PETSC_DEFAULT,&B);CHKERRQ(ierr); 411906656605SStefano Zampini ierr = MatScale(S_CC,m_one);CHKERRQ(ierr); 412006656605SStefano Zampini if (n_vertices) { 412180677318SStefano Zampini if (isCHOL) { /* if we can solve the interior problem with cholesky, we should also be fine with transposing here */ 412280677318SStefano Zampini ierr = MatTranspose(S_CV,MAT_REUSE_MATRIX,&S_VC);CHKERRQ(ierr); 412380677318SStefano Zampini } else { 412480677318SStefano Zampini Mat S_VCt; 412580677318SStefano Zampini 4126ffd830a3SStefano Zampini if (lda_rhs != n_R) { 4127ffd830a3SStefano Zampini ierr = MatDestroy(&B);CHKERRQ(ierr); 412872b8c272SStefano Zampini ierr = MatCreateSeqDense(PETSC_COMM_SELF,n_R,n_constraints,work,&B);CHKERRQ(ierr); 4129ffd830a3SStefano Zampini ierr = MatSeqDenseSetLDA(B,lda_rhs);CHKERRQ(ierr); 4130ffd830a3SStefano Zampini } 413180677318SStefano Zampini ierr = MatMatMult(A_VR,B,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&S_VCt);CHKERRQ(ierr); 413280677318SStefano Zampini ierr = MatCopy(S_VCt,S_VC,SAME_NONZERO_PATTERN);CHKERRQ(ierr); 413380677318SStefano Zampini ierr = MatDestroy(&S_VCt);CHKERRQ(ierr); 413480677318SStefano Zampini } 413506656605SStefano Zampini } 413606656605SStefano Zampini ierr = MatDestroy(&B);CHKERRQ(ierr); 413706656605SStefano Zampini /* coarse basis functions */ 413806656605SStefano Zampini for (i=0;i<n_constraints;i++) { 413906656605SStefano Zampini 
PetscScalar *y; 414006656605SStefano Zampini 4141ffd830a3SStefano Zampini ierr = VecPlaceArray(pcbddc->vec1_R,work+lda_rhs*i);CHKERRQ(ierr); 414206656605SStefano Zampini ierr = MatDenseGetArray(pcbddc->coarse_phi_B,&y);CHKERRQ(ierr); 414306656605SStefano Zampini ierr = VecPlaceArray(pcis->vec1_B,y+n_B*(i+n_vertices));CHKERRQ(ierr); 414406656605SStefano Zampini ierr = VecScatterBegin(pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 414506656605SStefano Zampini ierr = VecScatterEnd(pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 414606656605SStefano Zampini ierr = MatDenseRestoreArray(pcbddc->coarse_phi_B,&y);CHKERRQ(ierr); 414706656605SStefano Zampini ierr = VecResetArray(pcis->vec1_B);CHKERRQ(ierr); 414806656605SStefano Zampini if (pcbddc->switch_static || pcbddc->dbg_flag) { 41494f1b2e48SStefano Zampini PetscInt j; 41504f1b2e48SStefano Zampini 415106656605SStefano Zampini ierr = MatDenseGetArray(pcbddc->coarse_phi_D,&y);CHKERRQ(ierr); 415206656605SStefano Zampini ierr = VecPlaceArray(pcis->vec1_D,y+n_D*(i+n_vertices));CHKERRQ(ierr); 415306656605SStefano Zampini ierr = VecScatterBegin(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 415406656605SStefano Zampini ierr = VecScatterEnd(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 415506656605SStefano Zampini ierr = VecResetArray(pcis->vec1_D);CHKERRQ(ierr); 41564f1b2e48SStefano Zampini for (j=0;j<pcbddc->benign_n;j++) y[n_D*i+p0_lidx_I[j]] = 0.0; 415706656605SStefano Zampini ierr = MatDenseRestoreArray(pcbddc->coarse_phi_D,&y);CHKERRQ(ierr); 415806656605SStefano Zampini } 415906656605SStefano Zampini ierr = VecResetArray(pcbddc->vec1_R);CHKERRQ(ierr); 416006656605SStefano Zampini } 416106656605SStefano Zampini } 416280677318SStefano Zampini if (n_constraints) { 416380677318SStefano Zampini ierr = MatDestroy(&local_auxmat2_R);CHKERRQ(ierr); 
416480677318SStefano Zampini } 41654f1b2e48SStefano Zampini ierr = PetscFree(p0_lidx_I);CHKERRQ(ierr); 416672b8c272SStefano Zampini 416772b8c272SStefano Zampini /* coarse matrix entries relative to B_0 */ 416872b8c272SStefano Zampini if (pcbddc->benign_n) { 416972b8c272SStefano Zampini Mat B0_B,B0_BPHI; 417072b8c272SStefano Zampini IS is_dummy; 417172b8c272SStefano Zampini PetscScalar *data; 417272b8c272SStefano Zampini PetscInt j; 417372b8c272SStefano Zampini 417472b8c272SStefano Zampini ierr = ISCreateStride(PETSC_COMM_SELF,pcbddc->benign_n,0,1,&is_dummy);CHKERRQ(ierr); 41757dae84e0SHong Zhang ierr = MatCreateSubMatrix(pcbddc->benign_B0,is_dummy,pcis->is_B_local,MAT_INITIAL_MATRIX,&B0_B);CHKERRQ(ierr); 417672b8c272SStefano Zampini ierr = ISDestroy(&is_dummy);CHKERRQ(ierr); 417772b8c272SStefano Zampini ierr = MatMatMult(B0_B,pcbddc->coarse_phi_B,MAT_INITIAL_MATRIX,1.0,&B0_BPHI);CHKERRQ(ierr); 417886c38910SStefano Zampini ierr = MatConvert(B0_BPHI,MATSEQDENSE,MAT_INPLACE_MATRIX,&B0_BPHI);CHKERRQ(ierr); 417972b8c272SStefano Zampini ierr = MatDenseGetArray(B0_BPHI,&data);CHKERRQ(ierr); 418072b8c272SStefano Zampini for (j=0;j<pcbddc->benign_n;j++) { 418172b8c272SStefano Zampini PetscInt primal_idx = pcbddc->local_primal_size - pcbddc->benign_n + j; 418272b8c272SStefano Zampini for (i=0;i<pcbddc->local_primal_size;i++) { 418372b8c272SStefano Zampini coarse_submat_vals[primal_idx*pcbddc->local_primal_size+i] = data[i*pcbddc->benign_n+j]; 418472b8c272SStefano Zampini coarse_submat_vals[i*pcbddc->local_primal_size+primal_idx] = data[i*pcbddc->benign_n+j]; 418572b8c272SStefano Zampini } 418672b8c272SStefano Zampini } 418772b8c272SStefano Zampini ierr = MatDenseRestoreArray(B0_BPHI,&data);CHKERRQ(ierr); 418872b8c272SStefano Zampini ierr = MatDestroy(&B0_B);CHKERRQ(ierr); 418972b8c272SStefano Zampini ierr = MatDestroy(&B0_BPHI);CHKERRQ(ierr); 419072b8c272SStefano Zampini } 4191019a44ceSStefano Zampini 419206656605SStefano Zampini /* compute other basis functions for 
non-symmetric problems */ 41933301b35fSStefano Zampini if (!pcbddc->symmetric_primal) { 4194ffd830a3SStefano Zampini Mat B_V=NULL,B_C=NULL; 4195ffd830a3SStefano Zampini PetscScalar *marray; 419606656605SStefano Zampini 419706656605SStefano Zampini if (n_constraints) { 4198ffd830a3SStefano Zampini Mat S_CCT,C_CRT; 419906656605SStefano Zampini 4200abc8f43dSstefano_zampini ierr = MatTranspose(C_CR,MAT_INITIAL_MATRIX,&C_CRT);CHKERRQ(ierr); 420106656605SStefano Zampini ierr = MatTranspose(S_CC,MAT_INITIAL_MATRIX,&S_CCT);CHKERRQ(ierr); 4202ffd830a3SStefano Zampini ierr = MatMatMult(C_CRT,S_CCT,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&B_C);CHKERRQ(ierr); 420316f15bc4SStefano Zampini ierr = MatDestroy(&S_CCT);CHKERRQ(ierr); 420406656605SStefano Zampini if (n_vertices) { 4205ffd830a3SStefano Zampini Mat S_VCT; 420606656605SStefano Zampini 420706656605SStefano Zampini ierr = MatTranspose(S_VC,MAT_INITIAL_MATRIX,&S_VCT);CHKERRQ(ierr); 4208ffd830a3SStefano Zampini ierr = MatMatMult(C_CRT,S_VCT,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&B_V);CHKERRQ(ierr); 420916f15bc4SStefano Zampini ierr = MatDestroy(&S_VCT);CHKERRQ(ierr); 421006656605SStefano Zampini } 4211ffd830a3SStefano Zampini ierr = MatDestroy(&C_CRT);CHKERRQ(ierr); 42125b782168SStefano Zampini } else { 42135b782168SStefano Zampini ierr = MatCreateSeqDense(PETSC_COMM_SELF,n_R,n_vertices,NULL,&B_V);CHKERRQ(ierr); 421406656605SStefano Zampini } 421516f15bc4SStefano Zampini if (n_vertices && n_R) { 4216ffd830a3SStefano Zampini PetscScalar *av,*marray; 4217ffd830a3SStefano Zampini const PetscInt *xadj,*adjncy; 4218ffd830a3SStefano Zampini PetscInt n; 4219ffd830a3SStefano Zampini PetscBool flg_row; 422006656605SStefano Zampini 4221ffd830a3SStefano Zampini /* B_V = B_V - A_VR^T */ 4222af25d912SStefano Zampini ierr = MatConvert(A_VR,MATSEQAIJ,MAT_INPLACE_MATRIX,&A_VR);CHKERRQ(ierr); 4223ffd830a3SStefano Zampini ierr = MatGetRowIJ(A_VR,0,PETSC_FALSE,PETSC_FALSE,&n,&xadj,&adjncy,&flg_row);CHKERRQ(ierr); 4224ffd830a3SStefano Zampini ierr = 
MatSeqAIJGetArray(A_VR,&av);CHKERRQ(ierr); 4225ffd830a3SStefano Zampini ierr = MatDenseGetArray(B_V,&marray);CHKERRQ(ierr); 4226ffd830a3SStefano Zampini for (i=0;i<n;i++) { 4227ffd830a3SStefano Zampini PetscInt j; 4228ffd830a3SStefano Zampini for (j=xadj[i];j<xadj[i+1];j++) marray[i*n_R + adjncy[j]] -= av[j]; 4229ffd830a3SStefano Zampini } 4230ffd830a3SStefano Zampini ierr = MatDenseRestoreArray(B_V,&marray);CHKERRQ(ierr); 4231ffd830a3SStefano Zampini ierr = MatRestoreRowIJ(A_VR,0,PETSC_FALSE,PETSC_FALSE,&n,&xadj,&adjncy,&flg_row);CHKERRQ(ierr); 4232ffd830a3SStefano Zampini ierr = MatDestroy(&A_VR);CHKERRQ(ierr); 423306656605SStefano Zampini } 423406656605SStefano Zampini 4235ffd830a3SStefano Zampini /* currently there's no support for MatTransposeMatSolve(F,B,X) */ 4236abc8f43dSstefano_zampini if (n_vertices) { 4237ffd830a3SStefano Zampini ierr = MatDenseGetArray(B_V,&marray);CHKERRQ(ierr); 4238ffd830a3SStefano Zampini for (i=0;i<n_vertices;i++) { 4239ffd830a3SStefano Zampini ierr = VecPlaceArray(pcbddc->vec1_R,marray+i*n_R);CHKERRQ(ierr); 4240ffd830a3SStefano Zampini ierr = VecPlaceArray(pcbddc->vec2_R,work+i*n_R);CHKERRQ(ierr); 424106656605SStefano Zampini ierr = KSPSolveTranspose(pcbddc->ksp_R,pcbddc->vec1_R,pcbddc->vec2_R);CHKERRQ(ierr); 424206656605SStefano Zampini ierr = VecResetArray(pcbddc->vec1_R);CHKERRQ(ierr); 424306656605SStefano Zampini ierr = VecResetArray(pcbddc->vec2_R);CHKERRQ(ierr); 424406656605SStefano Zampini } 4245ffd830a3SStefano Zampini ierr = MatDenseRestoreArray(B_V,&marray);CHKERRQ(ierr); 4246abc8f43dSstefano_zampini } 42475b782168SStefano Zampini if (B_C) { 4248ffd830a3SStefano Zampini ierr = MatDenseGetArray(B_C,&marray);CHKERRQ(ierr); 4249ffd830a3SStefano Zampini for (i=n_vertices;i<n_constraints+n_vertices;i++) { 4250ffd830a3SStefano Zampini ierr = VecPlaceArray(pcbddc->vec1_R,marray+(i-n_vertices)*n_R);CHKERRQ(ierr); 4251ffd830a3SStefano Zampini ierr = VecPlaceArray(pcbddc->vec2_R,work+i*n_R);CHKERRQ(ierr); 4252ffd830a3SStefano 
Zampini ierr = KSPSolveTranspose(pcbddc->ksp_R,pcbddc->vec1_R,pcbddc->vec2_R);CHKERRQ(ierr); 4253ffd830a3SStefano Zampini ierr = VecResetArray(pcbddc->vec1_R);CHKERRQ(ierr); 4254ffd830a3SStefano Zampini ierr = VecResetArray(pcbddc->vec2_R);CHKERRQ(ierr); 425506656605SStefano Zampini } 4256ffd830a3SStefano Zampini ierr = MatDenseRestoreArray(B_C,&marray);CHKERRQ(ierr); 42575b782168SStefano Zampini } 425806656605SStefano Zampini /* coarse basis functions */ 425906656605SStefano Zampini for (i=0;i<pcbddc->local_primal_size;i++) { 426006656605SStefano Zampini PetscScalar *y; 426106656605SStefano Zampini 4262ffd830a3SStefano Zampini ierr = VecPlaceArray(pcbddc->vec1_R,work+i*n_R);CHKERRQ(ierr); 426306656605SStefano Zampini ierr = MatDenseGetArray(pcbddc->coarse_psi_B,&y);CHKERRQ(ierr); 426406656605SStefano Zampini ierr = VecPlaceArray(pcis->vec1_B,y+n_B*i);CHKERRQ(ierr); 426506656605SStefano Zampini ierr = VecScatterBegin(pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 426606656605SStefano Zampini ierr = VecScatterEnd(pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 426706656605SStefano Zampini if (i<n_vertices) { 426806656605SStefano Zampini y[n_B*i+idx_V_B[i]] = 1.0; 426906656605SStefano Zampini } 427006656605SStefano Zampini ierr = MatDenseRestoreArray(pcbddc->coarse_psi_B,&y);CHKERRQ(ierr); 427106656605SStefano Zampini ierr = VecResetArray(pcis->vec1_B);CHKERRQ(ierr); 427206656605SStefano Zampini 427306656605SStefano Zampini if (pcbddc->switch_static || pcbddc->dbg_flag) { 427406656605SStefano Zampini ierr = MatDenseGetArray(pcbddc->coarse_psi_D,&y);CHKERRQ(ierr); 427506656605SStefano Zampini ierr = VecPlaceArray(pcis->vec1_D,y+n_D*i);CHKERRQ(ierr); 427606656605SStefano Zampini ierr = VecScatterBegin(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 427706656605SStefano Zampini ierr = 
VecScatterEnd(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 427806656605SStefano Zampini ierr = VecResetArray(pcis->vec1_D);CHKERRQ(ierr); 427906656605SStefano Zampini ierr = MatDenseRestoreArray(pcbddc->coarse_psi_D,&y);CHKERRQ(ierr); 428006656605SStefano Zampini } 428106656605SStefano Zampini ierr = VecResetArray(pcbddc->vec1_R);CHKERRQ(ierr); 428206656605SStefano Zampini } 4283ffd830a3SStefano Zampini ierr = MatDestroy(&B_V);CHKERRQ(ierr); 4284ffd830a3SStefano Zampini ierr = MatDestroy(&B_C);CHKERRQ(ierr); 428506656605SStefano Zampini } 4286a6e023c1Sstefano_zampini 4287d62866d3SStefano Zampini /* free memory */ 428888ebb749SStefano Zampini ierr = PetscFree(idx_V_B);CHKERRQ(ierr); 428906656605SStefano Zampini ierr = MatDestroy(&S_VV);CHKERRQ(ierr); 429006656605SStefano Zampini ierr = MatDestroy(&S_CV);CHKERRQ(ierr); 429106656605SStefano Zampini ierr = MatDestroy(&S_VC);CHKERRQ(ierr); 429206656605SStefano Zampini ierr = MatDestroy(&S_CC);CHKERRQ(ierr); 4293d62866d3SStefano Zampini ierr = PetscFree(work);CHKERRQ(ierr); 4294d62866d3SStefano Zampini if (n_vertices) { 4295d62866d3SStefano Zampini ierr = MatDestroy(&A_VR);CHKERRQ(ierr); 4296d62866d3SStefano Zampini } 4297d62866d3SStefano Zampini if (n_constraints) { 4298d62866d3SStefano Zampini ierr = MatDestroy(&C_CR);CHKERRQ(ierr); 4299d62866d3SStefano Zampini } 430088ebb749SStefano Zampini /* Checking coarse_sub_mat and coarse basis functios */ 430188ebb749SStefano Zampini /* Symmetric case : It should be \Phi^{(j)^T} A^{(j)} \Phi^{(j)}=coarse_sub_mat */ 430288ebb749SStefano Zampini /* Non-symmetric case : It should be \Psi^{(j)^T} A^{(j)} \Phi^{(j)}=coarse_sub_mat */ 4303d12edf2fSStefano Zampini if (pcbddc->dbg_flag) { 430488ebb749SStefano Zampini Mat coarse_sub_mat; 430525084f0cSStefano Zampini Mat AUXMAT,TM1,TM2,TM3,TM4; 430688ebb749SStefano Zampini Mat coarse_phi_D,coarse_phi_B; 430788ebb749SStefano Zampini Mat coarse_psi_D,coarse_psi_B; 430888ebb749SStefano Zampini Mat 
A_II,A_BB,A_IB,A_BI; 43098bec7fa6SStefano Zampini Mat C_B,CPHI; 43108bec7fa6SStefano Zampini IS is_dummy; 43118bec7fa6SStefano Zampini Vec mones; 431288ebb749SStefano Zampini MatType checkmattype=MATSEQAIJ; 431388ebb749SStefano Zampini PetscReal real_value; 431488ebb749SStefano Zampini 4315a3df083aSStefano Zampini if (pcbddc->benign_n && !pcbddc->benign_change_explicit) { 4316a3df083aSStefano Zampini Mat A; 4317a3df083aSStefano Zampini ierr = PCBDDCBenignProject(pc,NULL,NULL,&A);CHKERRQ(ierr); 43187dae84e0SHong Zhang ierr = MatCreateSubMatrix(A,pcis->is_I_local,pcis->is_I_local,MAT_INITIAL_MATRIX,&A_II);CHKERRQ(ierr); 43197dae84e0SHong Zhang ierr = MatCreateSubMatrix(A,pcis->is_I_local,pcis->is_B_local,MAT_INITIAL_MATRIX,&A_IB);CHKERRQ(ierr); 43207dae84e0SHong Zhang ierr = MatCreateSubMatrix(A,pcis->is_B_local,pcis->is_I_local,MAT_INITIAL_MATRIX,&A_BI);CHKERRQ(ierr); 43217dae84e0SHong Zhang ierr = MatCreateSubMatrix(A,pcis->is_B_local,pcis->is_B_local,MAT_INITIAL_MATRIX,&A_BB);CHKERRQ(ierr); 4322a3df083aSStefano Zampini ierr = MatDestroy(&A);CHKERRQ(ierr); 4323a3df083aSStefano Zampini } else { 432488ebb749SStefano Zampini ierr = MatConvert(pcis->A_II,checkmattype,MAT_INITIAL_MATRIX,&A_II);CHKERRQ(ierr); 432588ebb749SStefano Zampini ierr = MatConvert(pcis->A_IB,checkmattype,MAT_INITIAL_MATRIX,&A_IB);CHKERRQ(ierr); 432688ebb749SStefano Zampini ierr = MatConvert(pcis->A_BI,checkmattype,MAT_INITIAL_MATRIX,&A_BI);CHKERRQ(ierr); 432788ebb749SStefano Zampini ierr = MatConvert(pcis->A_BB,checkmattype,MAT_INITIAL_MATRIX,&A_BB);CHKERRQ(ierr); 4328a3df083aSStefano Zampini } 432988ebb749SStefano Zampini ierr = MatConvert(pcbddc->coarse_phi_D,checkmattype,MAT_INITIAL_MATRIX,&coarse_phi_D);CHKERRQ(ierr); 433088ebb749SStefano Zampini ierr = MatConvert(pcbddc->coarse_phi_B,checkmattype,MAT_INITIAL_MATRIX,&coarse_phi_B);CHKERRQ(ierr); 4331ffd830a3SStefano Zampini if (!pcbddc->symmetric_primal) { 433288ebb749SStefano Zampini ierr = 
MatConvert(pcbddc->coarse_psi_D,checkmattype,MAT_INITIAL_MATRIX,&coarse_psi_D);CHKERRQ(ierr); 433388ebb749SStefano Zampini ierr = MatConvert(pcbddc->coarse_psi_B,checkmattype,MAT_INITIAL_MATRIX,&coarse_psi_B);CHKERRQ(ierr); 433488ebb749SStefano Zampini } 433588ebb749SStefano Zampini ierr = MatCreateSeqDense(PETSC_COMM_SELF,pcbddc->local_primal_size,pcbddc->local_primal_size,coarse_submat_vals,&coarse_sub_mat);CHKERRQ(ierr); 433688ebb749SStefano Zampini 433725084f0cSStefano Zampini ierr = PetscViewerASCIIPrintf(pcbddc->dbg_viewer,"--------------------------------------------------\n");CHKERRQ(ierr); 43383301b35fSStefano Zampini ierr = PetscViewerASCIIPrintf(pcbddc->dbg_viewer,"Check coarse sub mat computation (symmetric %d)\n",pcbddc->symmetric_primal);CHKERRQ(ierr); 433925084f0cSStefano Zampini ierr = PetscViewerFlush(pcbddc->dbg_viewer);CHKERRQ(ierr); 4340ffd830a3SStefano Zampini if (!pcbddc->symmetric_primal) { 434188ebb749SStefano Zampini ierr = MatMatMult(A_II,coarse_phi_D,MAT_INITIAL_MATRIX,1.0,&AUXMAT);CHKERRQ(ierr); 434288ebb749SStefano Zampini ierr = MatTransposeMatMult(coarse_psi_D,AUXMAT,MAT_INITIAL_MATRIX,1.0,&TM1);CHKERRQ(ierr); 434388ebb749SStefano Zampini ierr = MatDestroy(&AUXMAT);CHKERRQ(ierr); 434488ebb749SStefano Zampini ierr = MatMatMult(A_BB,coarse_phi_B,MAT_INITIAL_MATRIX,1.0,&AUXMAT);CHKERRQ(ierr); 434588ebb749SStefano Zampini ierr = MatTransposeMatMult(coarse_psi_B,AUXMAT,MAT_INITIAL_MATRIX,1.0,&TM2);CHKERRQ(ierr); 434688ebb749SStefano Zampini ierr = MatDestroy(&AUXMAT);CHKERRQ(ierr); 434788ebb749SStefano Zampini ierr = MatMatMult(A_IB,coarse_phi_B,MAT_INITIAL_MATRIX,1.0,&AUXMAT);CHKERRQ(ierr); 434888ebb749SStefano Zampini ierr = MatTransposeMatMult(coarse_psi_D,AUXMAT,MAT_INITIAL_MATRIX,1.0,&TM3);CHKERRQ(ierr); 434988ebb749SStefano Zampini ierr = MatDestroy(&AUXMAT);CHKERRQ(ierr); 435088ebb749SStefano Zampini ierr = MatMatMult(A_BI,coarse_phi_D,MAT_INITIAL_MATRIX,1.0,&AUXMAT);CHKERRQ(ierr); 435188ebb749SStefano Zampini ierr = 
MatTransposeMatMult(coarse_psi_B,AUXMAT,MAT_INITIAL_MATRIX,1.0,&TM4);CHKERRQ(ierr); 435288ebb749SStefano Zampini ierr = MatDestroy(&AUXMAT);CHKERRQ(ierr); 435388ebb749SStefano Zampini } else { 435488ebb749SStefano Zampini ierr = MatPtAP(A_II,coarse_phi_D,MAT_INITIAL_MATRIX,1.0,&TM1);CHKERRQ(ierr); 435588ebb749SStefano Zampini ierr = MatPtAP(A_BB,coarse_phi_B,MAT_INITIAL_MATRIX,1.0,&TM2);CHKERRQ(ierr); 435688ebb749SStefano Zampini ierr = MatMatMult(A_IB,coarse_phi_B,MAT_INITIAL_MATRIX,1.0,&AUXMAT);CHKERRQ(ierr); 435788ebb749SStefano Zampini ierr = MatTransposeMatMult(coarse_phi_D,AUXMAT,MAT_INITIAL_MATRIX,1.0,&TM3);CHKERRQ(ierr); 435888ebb749SStefano Zampini ierr = MatDestroy(&AUXMAT);CHKERRQ(ierr); 435988ebb749SStefano Zampini ierr = MatMatMult(A_BI,coarse_phi_D,MAT_INITIAL_MATRIX,1.0,&AUXMAT);CHKERRQ(ierr); 436088ebb749SStefano Zampini ierr = MatTransposeMatMult(coarse_phi_B,AUXMAT,MAT_INITIAL_MATRIX,1.0,&TM4);CHKERRQ(ierr); 436188ebb749SStefano Zampini ierr = MatDestroy(&AUXMAT);CHKERRQ(ierr); 436288ebb749SStefano Zampini } 436388ebb749SStefano Zampini ierr = MatAXPY(TM1,one,TM2,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr); 436488ebb749SStefano Zampini ierr = MatAXPY(TM1,one,TM3,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr); 436588ebb749SStefano Zampini ierr = MatAXPY(TM1,one,TM4,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr); 4366511c6705SHong Zhang ierr = MatConvert(TM1,MATSEQDENSE,MAT_INPLACE_MATRIX,&TM1);CHKERRQ(ierr); 43674f1b2e48SStefano Zampini if (pcbddc->benign_n) { 4368fc227af8SStefano Zampini Mat B0_B,B0_BPHI; 4369d12edf2fSStefano Zampini PetscScalar *data,*data2; 43704f1b2e48SStefano Zampini PetscInt j; 4371d12edf2fSStefano Zampini 43724f1b2e48SStefano Zampini ierr = ISCreateStride(PETSC_COMM_SELF,pcbddc->benign_n,0,1,&is_dummy);CHKERRQ(ierr); 43737dae84e0SHong Zhang ierr = MatCreateSubMatrix(pcbddc->benign_B0,is_dummy,pcis->is_B_local,MAT_INITIAL_MATRIX,&B0_B);CHKERRQ(ierr); 4374d12edf2fSStefano Zampini ierr = 
MatMatMult(B0_B,coarse_phi_B,MAT_INITIAL_MATRIX,1.0,&B0_BPHI);CHKERRQ(ierr); 437586c38910SStefano Zampini ierr = MatConvert(B0_BPHI,MATSEQDENSE,MAT_INPLACE_MATRIX,&B0_BPHI);CHKERRQ(ierr); 4376d12edf2fSStefano Zampini ierr = MatDenseGetArray(TM1,&data);CHKERRQ(ierr); 4377d12edf2fSStefano Zampini ierr = MatDenseGetArray(B0_BPHI,&data2);CHKERRQ(ierr); 43784f1b2e48SStefano Zampini for (j=0;j<pcbddc->benign_n;j++) { 43794f1b2e48SStefano Zampini PetscInt primal_idx = pcbddc->local_primal_size - pcbddc->benign_n + j; 4380d12edf2fSStefano Zampini for (i=0;i<pcbddc->local_primal_size;i++) { 43814f1b2e48SStefano Zampini data[primal_idx*pcbddc->local_primal_size+i] += data2[i*pcbddc->benign_n+j]; 43824f1b2e48SStefano Zampini data[i*pcbddc->local_primal_size+primal_idx] += data2[i*pcbddc->benign_n+j]; 43834f1b2e48SStefano Zampini } 4384d12edf2fSStefano Zampini } 4385d12edf2fSStefano Zampini ierr = MatDenseRestoreArray(TM1,&data);CHKERRQ(ierr); 4386d12edf2fSStefano Zampini ierr = MatDenseRestoreArray(B0_BPHI,&data2);CHKERRQ(ierr); 4387d12edf2fSStefano Zampini ierr = MatDestroy(&B0_B);CHKERRQ(ierr); 4388d12edf2fSStefano Zampini ierr = ISDestroy(&is_dummy);CHKERRQ(ierr); 4389d12edf2fSStefano Zampini ierr = MatDestroy(&B0_BPHI);CHKERRQ(ierr); 4390d12edf2fSStefano Zampini } 4391d12edf2fSStefano Zampini #if 0 4392d12edf2fSStefano Zampini { 4393d12edf2fSStefano Zampini PetscViewer viewer; 4394d12edf2fSStefano Zampini char filename[256]; 4395ffd830a3SStefano Zampini sprintf(filename,"details_local_coarse_mat%d_level%d.m",PetscGlobalRank,pcbddc->current_level); 4396d12edf2fSStefano Zampini ierr = PetscViewerASCIIOpen(PETSC_COMM_SELF,filename,&viewer);CHKERRQ(ierr); 4397d12edf2fSStefano Zampini ierr = PetscViewerSetFormat(viewer,PETSC_VIEWER_ASCII_MATLAB);CHKERRQ(ierr); 4398ffd830a3SStefano Zampini ierr = PetscObjectSetName((PetscObject)coarse_sub_mat,"computed");CHKERRQ(ierr); 4399ffd830a3SStefano Zampini ierr = MatView(coarse_sub_mat,viewer);CHKERRQ(ierr); 4400ffd830a3SStefano Zampini 
ierr = PetscObjectSetName((PetscObject)TM1,"projected");CHKERRQ(ierr); 4401d12edf2fSStefano Zampini ierr = MatView(TM1,viewer);CHKERRQ(ierr); 440272b8c272SStefano Zampini if (save_change) { 440372b8c272SStefano Zampini Mat phi_B; 440472b8c272SStefano Zampini ierr = MatMatMult(save_change,pcbddc->coarse_phi_B,MAT_INITIAL_MATRIX,1.0,&phi_B);CHKERRQ(ierr); 440572b8c272SStefano Zampini ierr = PetscObjectSetName((PetscObject)phi_B,"phi_B");CHKERRQ(ierr); 440672b8c272SStefano Zampini ierr = MatView(phi_B,viewer);CHKERRQ(ierr); 440772b8c272SStefano Zampini ierr = MatDestroy(&phi_B);CHKERRQ(ierr); 440872b8c272SStefano Zampini } else { 4409ffd830a3SStefano Zampini ierr = PetscObjectSetName((PetscObject)pcbddc->coarse_phi_B,"phi_B");CHKERRQ(ierr); 4410ffd830a3SStefano Zampini ierr = MatView(pcbddc->coarse_phi_B,viewer);CHKERRQ(ierr); 441172b8c272SStefano Zampini } 4412ffd830a3SStefano Zampini if (pcbddc->coarse_phi_D) { 4413ffd830a3SStefano Zampini ierr = PetscObjectSetName((PetscObject)pcbddc->coarse_phi_D,"phi_D");CHKERRQ(ierr); 4414ffd830a3SStefano Zampini ierr = MatView(pcbddc->coarse_phi_D,viewer);CHKERRQ(ierr); 4415ffd830a3SStefano Zampini } 4416ffd830a3SStefano Zampini if (pcbddc->coarse_psi_B) { 4417ffd830a3SStefano Zampini ierr = PetscObjectSetName((PetscObject)pcbddc->coarse_psi_B,"psi_B");CHKERRQ(ierr); 4418ffd830a3SStefano Zampini ierr = MatView(pcbddc->coarse_psi_B,viewer);CHKERRQ(ierr); 4419ffd830a3SStefano Zampini } 442072b8c272SStefano Zampini if (pcbddc->coarse_psi_D) { 4421ffd830a3SStefano Zampini ierr = PetscObjectSetName((PetscObject)pcbddc->coarse_psi_D,"psi_D");CHKERRQ(ierr); 4422ffd830a3SStefano Zampini ierr = MatView(pcbddc->coarse_psi_D,viewer);CHKERRQ(ierr); 4423ffd830a3SStefano Zampini } 4424d12edf2fSStefano Zampini ierr = PetscViewerDestroy(&viewer);CHKERRQ(ierr); 4425d12edf2fSStefano Zampini } 4426d12edf2fSStefano Zampini #endif 442781d9aea3SBarry Smith ierr = MatAXPY(TM1,m_one,coarse_sub_mat,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr); 
44288bec7fa6SStefano Zampini ierr = MatNorm(TM1,NORM_FROBENIUS,&real_value);CHKERRQ(ierr); 44291575c14dSBarry Smith ierr = PetscViewerASCIIPushSynchronized(pcbddc->dbg_viewer);CHKERRQ(ierr); 443006656605SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"Subdomain %04d matrix error % 1.14e\n",PetscGlobalRank,real_value);CHKERRQ(ierr); 44318bec7fa6SStefano Zampini 44328bec7fa6SStefano Zampini /* check constraints */ 4433a00504b5SStefano Zampini ierr = ISCreateStride(PETSC_COMM_SELF,pcbddc->local_primal_size-pcbddc->benign_n,0,1,&is_dummy);CHKERRQ(ierr); 44347dae84e0SHong Zhang ierr = MatCreateSubMatrix(pcbddc->ConstraintMatrix,is_dummy,pcis->is_B_local,MAT_INITIAL_MATRIX,&C_B);CHKERRQ(ierr); 44354f1b2e48SStefano Zampini if (!pcbddc->benign_n) { /* TODO: add benign case */ 44368bec7fa6SStefano Zampini ierr = MatMatMult(C_B,coarse_phi_B,MAT_INITIAL_MATRIX,1.0,&CPHI);CHKERRQ(ierr); 4437a00504b5SStefano Zampini } else { 4438a00504b5SStefano Zampini PetscScalar *data; 4439a00504b5SStefano Zampini Mat tmat; 4440a00504b5SStefano Zampini ierr = MatDenseGetArray(pcbddc->coarse_phi_B,&data);CHKERRQ(ierr); 4441a00504b5SStefano Zampini ierr = MatCreateSeqDense(PETSC_COMM_SELF,pcis->n_B,pcbddc->local_primal_size-pcbddc->benign_n,data,&tmat);CHKERRQ(ierr); 4442a00504b5SStefano Zampini ierr = MatDenseRestoreArray(pcbddc->coarse_phi_B,&data);CHKERRQ(ierr); 4443a00504b5SStefano Zampini ierr = MatMatMult(C_B,tmat,MAT_INITIAL_MATRIX,1.0,&CPHI);CHKERRQ(ierr); 4444a00504b5SStefano Zampini ierr = MatDestroy(&tmat);CHKERRQ(ierr); 4445a00504b5SStefano Zampini } 44468bec7fa6SStefano Zampini ierr = MatCreateVecs(CPHI,&mones,NULL);CHKERRQ(ierr); 44478bec7fa6SStefano Zampini ierr = VecSet(mones,-1.0);CHKERRQ(ierr); 44488bec7fa6SStefano Zampini ierr = MatDiagonalSet(CPHI,mones,ADD_VALUES);CHKERRQ(ierr); 44498bec7fa6SStefano Zampini ierr = MatNorm(CPHI,NORM_FROBENIUS,&real_value);CHKERRQ(ierr); 4450bdae7319SStefano Zampini ierr = 
PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"Subdomain %04d phi constraints error % 1.14e\n",PetscGlobalRank,real_value);CHKERRQ(ierr); 4451ffd830a3SStefano Zampini if (!pcbddc->symmetric_primal) { 4452bdae7319SStefano Zampini ierr = MatMatMult(C_B,coarse_psi_B,MAT_REUSE_MATRIX,1.0,&CPHI);CHKERRQ(ierr); 4453bdae7319SStefano Zampini ierr = VecSet(mones,-1.0);CHKERRQ(ierr); 4454bdae7319SStefano Zampini ierr = MatDiagonalSet(CPHI,mones,ADD_VALUES);CHKERRQ(ierr); 4455bdae7319SStefano Zampini ierr = MatNorm(CPHI,NORM_FROBENIUS,&real_value);CHKERRQ(ierr); 4456bdae7319SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"Subdomain %04d psi constraints error % 1.14e\n",PetscGlobalRank,real_value);CHKERRQ(ierr); 445788ebb749SStefano Zampini } 44588bec7fa6SStefano Zampini ierr = MatDestroy(&C_B);CHKERRQ(ierr); 44598bec7fa6SStefano Zampini ierr = MatDestroy(&CPHI);CHKERRQ(ierr); 44608bec7fa6SStefano Zampini ierr = ISDestroy(&is_dummy);CHKERRQ(ierr); 44618bec7fa6SStefano Zampini ierr = VecDestroy(&mones);CHKERRQ(ierr); 446225084f0cSStefano Zampini ierr = PetscViewerFlush(pcbddc->dbg_viewer);CHKERRQ(ierr); 446388ebb749SStefano Zampini ierr = MatDestroy(&A_II);CHKERRQ(ierr); 446488ebb749SStefano Zampini ierr = MatDestroy(&A_BB);CHKERRQ(ierr); 446588ebb749SStefano Zampini ierr = MatDestroy(&A_IB);CHKERRQ(ierr); 446688ebb749SStefano Zampini ierr = MatDestroy(&A_BI);CHKERRQ(ierr); 446788ebb749SStefano Zampini ierr = MatDestroy(&TM1);CHKERRQ(ierr); 446888ebb749SStefano Zampini ierr = MatDestroy(&TM2);CHKERRQ(ierr); 446988ebb749SStefano Zampini ierr = MatDestroy(&TM3);CHKERRQ(ierr); 447088ebb749SStefano Zampini ierr = MatDestroy(&TM4);CHKERRQ(ierr); 447188ebb749SStefano Zampini ierr = MatDestroy(&coarse_phi_D);CHKERRQ(ierr); 447288ebb749SStefano Zampini ierr = MatDestroy(&coarse_phi_B);CHKERRQ(ierr); 4473ffd830a3SStefano Zampini if (!pcbddc->symmetric_primal) { 447488ebb749SStefano Zampini ierr = MatDestroy(&coarse_psi_D);CHKERRQ(ierr); 
447588ebb749SStefano Zampini ierr = MatDestroy(&coarse_psi_B);CHKERRQ(ierr); 447688ebb749SStefano Zampini } 447788ebb749SStefano Zampini ierr = MatDestroy(&coarse_sub_mat);CHKERRQ(ierr); 447888ebb749SStefano Zampini } 44798629588bSStefano Zampini /* get back data */ 44808629588bSStefano Zampini *coarse_submat_vals_n = coarse_submat_vals; 448188ebb749SStefano Zampini PetscFunctionReturn(0); 448288ebb749SStefano Zampini } 448388ebb749SStefano Zampini 44847dae84e0SHong Zhang PetscErrorCode MatCreateSubMatrixUnsorted(Mat A, IS isrow, IS iscol, Mat* B) 4485aa0d41d4SStefano Zampini { 4486d65f70fdSStefano Zampini Mat *work_mat; 4487d65f70fdSStefano Zampini IS isrow_s,iscol_s; 4488d65f70fdSStefano Zampini PetscBool rsorted,csorted; 4489c43ebad9SStefano Zampini PetscInt rsize,*idxs_perm_r=NULL,csize,*idxs_perm_c=NULL; 4490aa0d41d4SStefano Zampini PetscErrorCode ierr; 4491aa0d41d4SStefano Zampini 4492aa0d41d4SStefano Zampini PetscFunctionBegin; 4493d65f70fdSStefano Zampini ierr = ISSorted(isrow,&rsorted);CHKERRQ(ierr); 4494d65f70fdSStefano Zampini ierr = ISSorted(iscol,&csorted);CHKERRQ(ierr); 4495d65f70fdSStefano Zampini ierr = ISGetLocalSize(isrow,&rsize);CHKERRQ(ierr); 4496d65f70fdSStefano Zampini ierr = ISGetLocalSize(iscol,&csize);CHKERRQ(ierr); 4497aa0d41d4SStefano Zampini 4498d65f70fdSStefano Zampini if (!rsorted) { 4499906d46d4SStefano Zampini const PetscInt *idxs; 4500906d46d4SStefano Zampini PetscInt *idxs_sorted,i; 4501aa0d41d4SStefano Zampini 4502d65f70fdSStefano Zampini ierr = PetscMalloc1(rsize,&idxs_perm_r);CHKERRQ(ierr); 4503d65f70fdSStefano Zampini ierr = PetscMalloc1(rsize,&idxs_sorted);CHKERRQ(ierr); 4504d65f70fdSStefano Zampini for (i=0;i<rsize;i++) { 4505d65f70fdSStefano Zampini idxs_perm_r[i] = i; 4506aa0d41d4SStefano Zampini } 4507d65f70fdSStefano Zampini ierr = ISGetIndices(isrow,&idxs);CHKERRQ(ierr); 4508d65f70fdSStefano Zampini ierr = PetscSortIntWithPermutation(rsize,idxs,idxs_perm_r);CHKERRQ(ierr); 4509d65f70fdSStefano Zampini for 
(i=0;i<rsize;i++) { 4510d65f70fdSStefano Zampini idxs_sorted[i] = idxs[idxs_perm_r[i]]; 4511aa0d41d4SStefano Zampini } 4512d65f70fdSStefano Zampini ierr = ISRestoreIndices(isrow,&idxs);CHKERRQ(ierr); 4513d65f70fdSStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,rsize,idxs_sorted,PETSC_OWN_POINTER,&isrow_s);CHKERRQ(ierr); 4514d65f70fdSStefano Zampini } else { 4515d65f70fdSStefano Zampini ierr = PetscObjectReference((PetscObject)isrow);CHKERRQ(ierr); 4516d65f70fdSStefano Zampini isrow_s = isrow; 4517aa0d41d4SStefano Zampini } 4518906d46d4SStefano Zampini 4519d65f70fdSStefano Zampini if (!csorted) { 4520d65f70fdSStefano Zampini if (isrow == iscol) { 4521d65f70fdSStefano Zampini ierr = PetscObjectReference((PetscObject)isrow_s);CHKERRQ(ierr); 4522d65f70fdSStefano Zampini iscol_s = isrow_s; 4523d65f70fdSStefano Zampini } else { 4524d65f70fdSStefano Zampini const PetscInt *idxs; 4525d65f70fdSStefano Zampini PetscInt *idxs_sorted,i; 4526906d46d4SStefano Zampini 4527d65f70fdSStefano Zampini ierr = PetscMalloc1(csize,&idxs_perm_c);CHKERRQ(ierr); 4528d65f70fdSStefano Zampini ierr = PetscMalloc1(csize,&idxs_sorted);CHKERRQ(ierr); 4529d65f70fdSStefano Zampini for (i=0;i<csize;i++) { 4530d65f70fdSStefano Zampini idxs_perm_c[i] = i; 4531d65f70fdSStefano Zampini } 4532d65f70fdSStefano Zampini ierr = ISGetIndices(iscol,&idxs);CHKERRQ(ierr); 4533d65f70fdSStefano Zampini ierr = PetscSortIntWithPermutation(csize,idxs,idxs_perm_c);CHKERRQ(ierr); 4534d65f70fdSStefano Zampini for (i=0;i<csize;i++) { 4535d65f70fdSStefano Zampini idxs_sorted[i] = idxs[idxs_perm_c[i]]; 4536d65f70fdSStefano Zampini } 4537d65f70fdSStefano Zampini ierr = ISRestoreIndices(iscol,&idxs);CHKERRQ(ierr); 4538d65f70fdSStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,csize,idxs_sorted,PETSC_OWN_POINTER,&iscol_s);CHKERRQ(ierr); 4539d65f70fdSStefano Zampini } 4540d65f70fdSStefano Zampini } else { 4541d65f70fdSStefano Zampini ierr = PetscObjectReference((PetscObject)iscol);CHKERRQ(ierr); 4542d65f70fdSStefano 
Zampini iscol_s = iscol; 4543d65f70fdSStefano Zampini } 4544d65f70fdSStefano Zampini 45457dae84e0SHong Zhang ierr = MatCreateSubMatrices(A,1,&isrow_s,&iscol_s,MAT_INITIAL_MATRIX,&work_mat);CHKERRQ(ierr); 4546d65f70fdSStefano Zampini 4547d65f70fdSStefano Zampini if (!rsorted || !csorted) { 4548906d46d4SStefano Zampini Mat new_mat; 4549d65f70fdSStefano Zampini IS is_perm_r,is_perm_c; 4550906d46d4SStefano Zampini 4551d65f70fdSStefano Zampini if (!rsorted) { 4552d65f70fdSStefano Zampini PetscInt *idxs_r,i; 4553d65f70fdSStefano Zampini ierr = PetscMalloc1(rsize,&idxs_r);CHKERRQ(ierr); 4554d65f70fdSStefano Zampini for (i=0;i<rsize;i++) { 4555d65f70fdSStefano Zampini idxs_r[idxs_perm_r[i]] = i; 4556906d46d4SStefano Zampini } 4557d65f70fdSStefano Zampini ierr = PetscFree(idxs_perm_r);CHKERRQ(ierr); 4558d65f70fdSStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,rsize,idxs_r,PETSC_OWN_POINTER,&is_perm_r);CHKERRQ(ierr); 4559d65f70fdSStefano Zampini } else { 4560d65f70fdSStefano Zampini ierr = ISCreateStride(PETSC_COMM_SELF,rsize,0,1,&is_perm_r);CHKERRQ(ierr); 4561906d46d4SStefano Zampini } 4562d65f70fdSStefano Zampini ierr = ISSetPermutation(is_perm_r);CHKERRQ(ierr); 4563d65f70fdSStefano Zampini 4564d65f70fdSStefano Zampini if (!csorted) { 4565d65f70fdSStefano Zampini if (isrow_s == iscol_s) { 4566d65f70fdSStefano Zampini ierr = PetscObjectReference((PetscObject)is_perm_r);CHKERRQ(ierr); 4567d65f70fdSStefano Zampini is_perm_c = is_perm_r; 4568d65f70fdSStefano Zampini } else { 4569d65f70fdSStefano Zampini PetscInt *idxs_c,i; 4570f913dca9SStefano Zampini if (!idxs_perm_c) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Permutation array not present"); 4571d65f70fdSStefano Zampini ierr = PetscMalloc1(csize,&idxs_c);CHKERRQ(ierr); 4572d65f70fdSStefano Zampini for (i=0;i<csize;i++) { 4573d65f70fdSStefano Zampini idxs_c[idxs_perm_c[i]] = i; 4574d65f70fdSStefano Zampini } 4575d65f70fdSStefano Zampini ierr = PetscFree(idxs_perm_c);CHKERRQ(ierr); 4576d65f70fdSStefano Zampini ierr = 
ISCreateGeneral(PETSC_COMM_SELF,csize,idxs_c,PETSC_OWN_POINTER,&is_perm_c);CHKERRQ(ierr); 4577d65f70fdSStefano Zampini } 4578d65f70fdSStefano Zampini } else { 4579d65f70fdSStefano Zampini ierr = ISCreateStride(PETSC_COMM_SELF,csize,0,1,&is_perm_c);CHKERRQ(ierr); 4580d65f70fdSStefano Zampini } 4581d65f70fdSStefano Zampini ierr = ISSetPermutation(is_perm_c);CHKERRQ(ierr); 4582d65f70fdSStefano Zampini 4583d65f70fdSStefano Zampini ierr = MatPermute(work_mat[0],is_perm_r,is_perm_c,&new_mat);CHKERRQ(ierr); 4584d65f70fdSStefano Zampini ierr = MatDestroy(&work_mat[0]);CHKERRQ(ierr); 4585d65f70fdSStefano Zampini work_mat[0] = new_mat; 4586d65f70fdSStefano Zampini ierr = ISDestroy(&is_perm_r);CHKERRQ(ierr); 4587d65f70fdSStefano Zampini ierr = ISDestroy(&is_perm_c);CHKERRQ(ierr); 4588d65f70fdSStefano Zampini } 4589d65f70fdSStefano Zampini 4590d65f70fdSStefano Zampini ierr = PetscObjectReference((PetscObject)work_mat[0]);CHKERRQ(ierr); 4591d65f70fdSStefano Zampini *B = work_mat[0]; 4592d65f70fdSStefano Zampini ierr = MatDestroyMatrices(1,&work_mat);CHKERRQ(ierr); 4593d65f70fdSStefano Zampini ierr = ISDestroy(&isrow_s);CHKERRQ(ierr); 4594d65f70fdSStefano Zampini ierr = ISDestroy(&iscol_s);CHKERRQ(ierr); 4595d65f70fdSStefano Zampini PetscFunctionReturn(0); 4596d65f70fdSStefano Zampini } 4597d65f70fdSStefano Zampini 45985e8657edSStefano Zampini PetscErrorCode PCBDDCComputeLocalMatrix(PC pc, Mat ChangeOfBasisMatrix) 4599aa0d41d4SStefano Zampini { 4600aa0d41d4SStefano Zampini Mat_IS* matis = (Mat_IS*)pc->pmat->data; 46015e8657edSStefano Zampini PC_BDDC* pcbddc = (PC_BDDC*)pc->data; 4602022d8d2bSstefano_zampini Mat new_mat,lA; 46035e8657edSStefano Zampini IS is_local,is_global; 4604d65f70fdSStefano Zampini PetscInt local_size; 4605d65f70fdSStefano Zampini PetscBool isseqaij; 4606aa0d41d4SStefano Zampini PetscErrorCode ierr; 4607aa0d41d4SStefano Zampini 4608aa0d41d4SStefano Zampini PetscFunctionBegin; 4609aa0d41d4SStefano Zampini ierr = MatDestroy(&pcbddc->local_mat);CHKERRQ(ierr); 
46105e8657edSStefano Zampini ierr = MatGetSize(matis->A,&local_size,NULL);CHKERRQ(ierr); 46115e8657edSStefano Zampini ierr = ISCreateStride(PetscObjectComm((PetscObject)matis->A),local_size,0,1,&is_local);CHKERRQ(ierr); 4612b087196eSStefano Zampini ierr = ISLocalToGlobalMappingApplyIS(pc->pmat->rmap->mapping,is_local,&is_global);CHKERRQ(ierr); 4613aa0d41d4SStefano Zampini ierr = ISDestroy(&is_local);CHKERRQ(ierr); 46147dae84e0SHong Zhang ierr = MatCreateSubMatrixUnsorted(ChangeOfBasisMatrix,is_global,is_global,&new_mat);CHKERRQ(ierr); 4615aa0d41d4SStefano Zampini ierr = ISDestroy(&is_global);CHKERRQ(ierr); 4616906d46d4SStefano Zampini 4617906d46d4SStefano Zampini /* check */ 4618906d46d4SStefano Zampini if (pcbddc->dbg_flag) { 4619906d46d4SStefano Zampini Vec x,x_change; 4620906d46d4SStefano Zampini PetscReal error; 4621906d46d4SStefano Zampini 46225e8657edSStefano Zampini ierr = MatCreateVecs(ChangeOfBasisMatrix,&x,&x_change);CHKERRQ(ierr); 4623906d46d4SStefano Zampini ierr = VecSetRandom(x,NULL);CHKERRQ(ierr); 46245e8657edSStefano Zampini ierr = MatMult(ChangeOfBasisMatrix,x,x_change);CHKERRQ(ierr); 4625e176bc59SStefano Zampini ierr = VecScatterBegin(matis->cctx,x,matis->x,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 4626e176bc59SStefano Zampini ierr = VecScatterEnd(matis->cctx,x,matis->x,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 4627d65f70fdSStefano Zampini ierr = MatMult(new_mat,matis->x,matis->y);CHKERRQ(ierr); 462888428137SStefano Zampini if (!pcbddc->change_interior) { 462988428137SStefano Zampini const PetscScalar *x,*y,*v; 463088428137SStefano Zampini PetscReal lerror = 0.; 463188428137SStefano Zampini PetscInt i; 463288428137SStefano Zampini 463388428137SStefano Zampini ierr = VecGetArrayRead(matis->x,&x);CHKERRQ(ierr); 463488428137SStefano Zampini ierr = VecGetArrayRead(matis->y,&y);CHKERRQ(ierr); 463588428137SStefano Zampini ierr = VecGetArrayRead(matis->counter,&v);CHKERRQ(ierr); 463688428137SStefano Zampini for (i=0;i<local_size;i++) 
463788428137SStefano Zampini if (PetscRealPart(v[i]) < 1.5 && PetscAbsScalar(x[i]-y[i]) > lerror) 463888428137SStefano Zampini lerror = PetscAbsScalar(x[i]-y[i]); 463988428137SStefano Zampini ierr = VecRestoreArrayRead(matis->x,&x);CHKERRQ(ierr); 464088428137SStefano Zampini ierr = VecRestoreArrayRead(matis->y,&y);CHKERRQ(ierr); 464188428137SStefano Zampini ierr = VecRestoreArrayRead(matis->counter,&v);CHKERRQ(ierr); 464288428137SStefano Zampini ierr = MPIU_Allreduce(&lerror,&error,1,MPIU_REAL,MPI_MAX,PetscObjectComm((PetscObject)pc));CHKERRQ(ierr); 4643637e8532SStefano Zampini if (error > PETSC_SMALL) { 4644637e8532SStefano Zampini if (!pcbddc->user_ChangeOfBasisMatrix || pcbddc->current_level) { 4645637e8532SStefano Zampini SETERRQ1(PetscObjectComm((PetscObject)pc),PETSC_ERR_PLIB,"Error global vs local change on I: %1.6e\n",error); 4646637e8532SStefano Zampini } else { 4647637e8532SStefano Zampini SETERRQ1(PetscObjectComm((PetscObject)pc),PETSC_ERR_USER,"Error global vs local change on I: %1.6e\n",error); 4648637e8532SStefano Zampini } 4649637e8532SStefano Zampini } 465088428137SStefano Zampini } 4651e176bc59SStefano Zampini ierr = VecScatterBegin(matis->rctx,matis->y,x,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 4652e176bc59SStefano Zampini ierr = VecScatterEnd(matis->rctx,matis->y,x,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 4653906d46d4SStefano Zampini ierr = VecAXPY(x,-1.0,x_change);CHKERRQ(ierr); 4654906d46d4SStefano Zampini ierr = VecNorm(x,NORM_INFINITY,&error);CHKERRQ(ierr); 4655637e8532SStefano Zampini if (error > PETSC_SMALL) { 4656637e8532SStefano Zampini if (!pcbddc->user_ChangeOfBasisMatrix || pcbddc->current_level) { 4657637e8532SStefano Zampini SETERRQ1(PetscObjectComm((PetscObject)pc),PETSC_ERR_PLIB,"Error global vs local change on N: %1.6e\n",error); 4658637e8532SStefano Zampini } else { 4659637e8532SStefano Zampini SETERRQ1(PetscObjectComm((PetscObject)pc),PETSC_ERR_USER,"Error global vs local change on N: %1.6e\n",error); 
4660637e8532SStefano Zampini } 4661637e8532SStefano Zampini } 4662906d46d4SStefano Zampini ierr = VecDestroy(&x);CHKERRQ(ierr); 4663906d46d4SStefano Zampini ierr = VecDestroy(&x_change);CHKERRQ(ierr); 4664906d46d4SStefano Zampini } 4665906d46d4SStefano Zampini 4666022d8d2bSstefano_zampini /* lA is present if we are setting up an inner BDDC for a saddle point FETI-DP */ 4667022d8d2bSstefano_zampini ierr = PetscObjectQuery((PetscObject)pc,"__KSPFETIDP_lA" ,(PetscObject*)&lA);CHKERRQ(ierr); 4668022d8d2bSstefano_zampini 466922d5777bSStefano Zampini /* TODO: HOW TO WORK WITH BAIJ and SBAIJ and SEQDENSE? */ 46709b28b3ffSStefano Zampini ierr = PetscObjectTypeCompare((PetscObject)matis->A,MATSEQAIJ,&isseqaij);CHKERRQ(ierr); 467122d5777bSStefano Zampini if (isseqaij) { 4672a00504b5SStefano Zampini ierr = MatDestroy(&pcbddc->local_mat);CHKERRQ(ierr); 4673a00504b5SStefano Zampini ierr = MatPtAP(matis->A,new_mat,MAT_INITIAL_MATRIX,2.0,&pcbddc->local_mat);CHKERRQ(ierr); 4674022d8d2bSstefano_zampini if (lA) { 4675022d8d2bSstefano_zampini Mat work; 4676022d8d2bSstefano_zampini ierr = MatPtAP(lA,new_mat,MAT_INITIAL_MATRIX,2.0,&work);CHKERRQ(ierr); 4677022d8d2bSstefano_zampini ierr = PetscObjectCompose((PetscObject)pc,"__KSPFETIDP_lA" ,(PetscObject)work);CHKERRQ(ierr); 4678022d8d2bSstefano_zampini ierr = MatDestroy(&work);CHKERRQ(ierr); 4679022d8d2bSstefano_zampini } 4680aa0d41d4SStefano Zampini } else { 4681a00504b5SStefano Zampini Mat work_mat; 46821cf9b237SStefano Zampini 4683a00504b5SStefano Zampini ierr = MatDestroy(&pcbddc->local_mat);CHKERRQ(ierr); 4684aa0d41d4SStefano Zampini ierr = MatConvert(matis->A,MATSEQAIJ,MAT_INITIAL_MATRIX,&work_mat);CHKERRQ(ierr); 4685a00504b5SStefano Zampini ierr = MatPtAP(work_mat,new_mat,MAT_INITIAL_MATRIX,2.0,&pcbddc->local_mat);CHKERRQ(ierr); 46861d82a3b6SStefano Zampini ierr = MatDestroy(&work_mat);CHKERRQ(ierr); 4687022d8d2bSstefano_zampini if (lA) { 4688022d8d2bSstefano_zampini Mat work; 4689022d8d2bSstefano_zampini ierr = 
MatConvert(lA,MATSEQAIJ,MAT_INITIAL_MATRIX,&work_mat);CHKERRQ(ierr); 4690022d8d2bSstefano_zampini ierr = MatPtAP(work_mat,new_mat,MAT_INITIAL_MATRIX,2.0,&work);CHKERRQ(ierr); 4691022d8d2bSstefano_zampini ierr = PetscObjectCompose((PetscObject)pc,"__KSPFETIDP_lA" ,(PetscObject)work);CHKERRQ(ierr); 4692022d8d2bSstefano_zampini ierr = MatDestroy(&work);CHKERRQ(ierr); 4693022d8d2bSstefano_zampini } 4694aa0d41d4SStefano Zampini } 46953301b35fSStefano Zampini if (matis->A->symmetric_set) { 46963301b35fSStefano Zampini ierr = MatSetOption(pcbddc->local_mat,MAT_SYMMETRIC,matis->A->symmetric);CHKERRQ(ierr); 4697e496cd5dSStefano Zampini #if !defined(PETSC_USE_COMPLEX) 46983301b35fSStefano Zampini ierr = MatSetOption(pcbddc->local_mat,MAT_HERMITIAN,matis->A->symmetric);CHKERRQ(ierr); 4699e496cd5dSStefano Zampini #endif 47003301b35fSStefano Zampini } 4701d65f70fdSStefano Zampini ierr = MatDestroy(&new_mat);CHKERRQ(ierr); 4702aa0d41d4SStefano Zampini PetscFunctionReturn(0); 4703aa0d41d4SStefano Zampini } 4704aa0d41d4SStefano Zampini 47058ce42a96SStefano Zampini PetscErrorCode PCBDDCSetUpLocalScatters(PC pc) 4706a64d13efSStefano Zampini { 4707a64d13efSStefano Zampini PC_IS* pcis = (PC_IS*)(pc->data); 4708a64d13efSStefano Zampini PC_BDDC* pcbddc = (PC_BDDC*)pc->data; 4709d62866d3SStefano Zampini PCBDDCSubSchurs sub_schurs = pcbddc->sub_schurs; 471053892102SStefano Zampini PetscInt *idx_R_local=NULL; 47113a50541eSStefano Zampini PetscInt n_vertices,i,j,n_R,n_D,n_B; 47123a50541eSStefano Zampini PetscInt vbs,bs; 47136816873aSStefano Zampini PetscBT bitmask=NULL; 4714a64d13efSStefano Zampini PetscErrorCode ierr; 4715a64d13efSStefano Zampini 4716a64d13efSStefano Zampini PetscFunctionBegin; 4717b23d619eSStefano Zampini /* 4718b23d619eSStefano Zampini No need to setup local scatters if 4719b23d619eSStefano Zampini - primal space is unchanged 4720b23d619eSStefano Zampini AND 4721b23d619eSStefano Zampini - we actually have locally some primal dofs (could not be true in multilevel or for 
isolated subdomains) 4722b23d619eSStefano Zampini AND 4723b23d619eSStefano Zampini - we are not in debugging mode (this is needed since there are Synchronized prints at the end of the subroutine 4724b23d619eSStefano Zampini */ 4725b23d619eSStefano Zampini if (!pcbddc->new_primal_space_local && pcbddc->local_primal_size && !pcbddc->dbg_flag) { 4726f4ddd8eeSStefano Zampini PetscFunctionReturn(0); 4727f4ddd8eeSStefano Zampini } 4728f4ddd8eeSStefano Zampini /* destroy old objects */ 4729f4ddd8eeSStefano Zampini ierr = ISDestroy(&pcbddc->is_R_local);CHKERRQ(ierr); 4730f4ddd8eeSStefano Zampini ierr = VecScatterDestroy(&pcbddc->R_to_B);CHKERRQ(ierr); 4731f4ddd8eeSStefano Zampini ierr = VecScatterDestroy(&pcbddc->R_to_D);CHKERRQ(ierr); 4732a64d13efSStefano Zampini /* Set Non-overlapping dimensions */ 4733b371cd4fSStefano Zampini n_B = pcis->n_B; 4734b371cd4fSStefano Zampini n_D = pcis->n - n_B; 4735b371cd4fSStefano Zampini n_vertices = pcbddc->n_vertices; 47363a50541eSStefano Zampini 4737a64d13efSStefano Zampini /* Dohrmann's notation: dofs splitted in R (Remaining: all dofs but the vertices) and V (Vertices) */ 47386816873aSStefano Zampini 473953892102SStefano Zampini /* create auxiliary bitmask and allocate workspace */ 4740b334f244SStefano Zampini if (!sub_schurs || !sub_schurs->reuse_solver) { 4741854ce69bSBarry Smith ierr = PetscMalloc1(pcis->n-n_vertices,&idx_R_local);CHKERRQ(ierr); 4742a64d13efSStefano Zampini ierr = PetscBTCreate(pcis->n,&bitmask);CHKERRQ(ierr); 4743a64d13efSStefano Zampini for (i=0;i<n_vertices;i++) { 47440e6343abSStefano Zampini ierr = PetscBTSet(bitmask,pcbddc->local_primal_ref_node[i]);CHKERRQ(ierr); 4745a64d13efSStefano Zampini } 4746a64d13efSStefano Zampini 4747a64d13efSStefano Zampini for (i=0, n_R=0; i<pcis->n; i++) { 47484641a718SStefano Zampini if (!PetscBTLookup(bitmask,i)) { 47496816873aSStefano Zampini idx_R_local[n_R++] = i; 4750a64d13efSStefano Zampini } 4751a64d13efSStefano Zampini } 4752df4d28bfSStefano Zampini } else { /* A 
different ordering (already computed) is present if we are reusing the Schur solver */ 4753df4d28bfSStefano Zampini PCBDDCReuseSolvers reuse_solver = sub_schurs->reuse_solver; 47546816873aSStefano Zampini 4755df4d28bfSStefano Zampini ierr = ISGetIndices(reuse_solver->is_R,(const PetscInt**)&idx_R_local);CHKERRQ(ierr); 4756df4d28bfSStefano Zampini ierr = ISGetLocalSize(reuse_solver->is_R,&n_R);CHKERRQ(ierr); 47576816873aSStefano Zampini } 47583a50541eSStefano Zampini 47593a50541eSStefano Zampini /* Block code */ 47603a50541eSStefano Zampini vbs = 1; 47613a50541eSStefano Zampini ierr = MatGetBlockSize(pcbddc->local_mat,&bs);CHKERRQ(ierr); 47623a50541eSStefano Zampini if (bs>1 && !(n_vertices%bs)) { 47633a50541eSStefano Zampini PetscBool is_blocked = PETSC_TRUE; 47643a50541eSStefano Zampini PetscInt *vary; 4765b334f244SStefano Zampini if (!sub_schurs || !sub_schurs->reuse_solver) { 4766785e854fSJed Brown ierr = PetscMalloc1(pcis->n/bs,&vary);CHKERRQ(ierr); 47673a50541eSStefano Zampini ierr = PetscMemzero(vary,pcis->n/bs*sizeof(PetscInt));CHKERRQ(ierr); 4768d3df7717SStefano Zampini /* Verify that the vertex indices correspond to each element in a block (code taken from sbaij2.c) */ 4769d3df7717SStefano Zampini /* it is ok to check this way since local_primal_ref_node are always sorted by local numbering and idx_R_local is obtained as a complement */ 47700e6343abSStefano Zampini for (i=0; i<n_vertices; i++) vary[pcbddc->local_primal_ref_node[i]/bs]++; 4771d3df7717SStefano Zampini for (i=0; i<pcis->n/bs; i++) { 47723a50541eSStefano Zampini if (vary[i]!=0 && vary[i]!=bs) { 47733a50541eSStefano Zampini is_blocked = PETSC_FALSE; 47743a50541eSStefano Zampini break; 47753a50541eSStefano Zampini } 47763a50541eSStefano Zampini } 4777d3df7717SStefano Zampini ierr = PetscFree(vary);CHKERRQ(ierr); 4778d3df7717SStefano Zampini } else { 4779d3df7717SStefano Zampini /* Verify directly the R set */ 4780d3df7717SStefano Zampini for (i=0; i<n_R/bs; i++) { 4781d3df7717SStefano Zampini 
PetscInt j,node=idx_R_local[bs*i]; 4782d3df7717SStefano Zampini for (j=1; j<bs; j++) { 4783d3df7717SStefano Zampini if (node != idx_R_local[bs*i+j]-j) { 4784d3df7717SStefano Zampini is_blocked = PETSC_FALSE; 4785d3df7717SStefano Zampini break; 4786d3df7717SStefano Zampini } 4787d3df7717SStefano Zampini } 4788d3df7717SStefano Zampini } 4789d3df7717SStefano Zampini } 47903a50541eSStefano Zampini if (is_blocked) { /* build compressed IS for R nodes (complement of vertices) */ 47913a50541eSStefano Zampini vbs = bs; 47923a50541eSStefano Zampini for (i=0;i<n_R/vbs;i++) { 47933a50541eSStefano Zampini idx_R_local[i] = idx_R_local[vbs*i]/vbs; 47943a50541eSStefano Zampini } 47953a50541eSStefano Zampini } 47963a50541eSStefano Zampini } 47973a50541eSStefano Zampini ierr = ISCreateBlock(PETSC_COMM_SELF,vbs,n_R/vbs,idx_R_local,PETSC_COPY_VALUES,&pcbddc->is_R_local);CHKERRQ(ierr); 4798b334f244SStefano Zampini if (sub_schurs && sub_schurs->reuse_solver) { 4799df4d28bfSStefano Zampini PCBDDCReuseSolvers reuse_solver = sub_schurs->reuse_solver; 480053892102SStefano Zampini 4801df4d28bfSStefano Zampini ierr = ISRestoreIndices(reuse_solver->is_R,(const PetscInt**)&idx_R_local);CHKERRQ(ierr); 4802df4d28bfSStefano Zampini ierr = ISDestroy(&reuse_solver->is_R);CHKERRQ(ierr); 480353892102SStefano Zampini ierr = PetscObjectReference((PetscObject)pcbddc->is_R_local);CHKERRQ(ierr); 4804df4d28bfSStefano Zampini reuse_solver->is_R = pcbddc->is_R_local; 480553892102SStefano Zampini } else { 48063a50541eSStefano Zampini ierr = PetscFree(idx_R_local);CHKERRQ(ierr); 480753892102SStefano Zampini } 4808a64d13efSStefano Zampini 4809a64d13efSStefano Zampini /* print some info if requested */ 4810a64d13efSStefano Zampini if (pcbddc->dbg_flag) { 4811a64d13efSStefano Zampini ierr = PetscViewerASCIIPrintf(pcbddc->dbg_viewer,"--------------------------------------------------\n");CHKERRQ(ierr); 4812a64d13efSStefano Zampini ierr = PetscViewerFlush(pcbddc->dbg_viewer);CHKERRQ(ierr); 48131575c14dSBarry Smith 
ierr = PetscViewerASCIIPushSynchronized(pcbddc->dbg_viewer);CHKERRQ(ierr); 4814a64d13efSStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"Subdomain %04d local dimensions\n",PetscGlobalRank);CHKERRQ(ierr); 4815a64d13efSStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"local_size = %d, dirichlet_size = %d, boundary_size = %d\n",pcis->n,n_D,n_B);CHKERRQ(ierr); 48164f1b2e48SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"r_size = %d, v_size = %d, constraints = %d, local_primal_size = %d\n",n_R,n_vertices,pcbddc->local_primal_size-n_vertices-pcbddc->benign_n,pcbddc->local_primal_size);CHKERRQ(ierr); 4817a64d13efSStefano Zampini ierr = PetscViewerFlush(pcbddc->dbg_viewer);CHKERRQ(ierr); 4818a64d13efSStefano Zampini } 4819a64d13efSStefano Zampini 4820a64d13efSStefano Zampini /* VecScatters pcbddc->R_to_B and (optionally) pcbddc->R_to_D */ 4821b334f244SStefano Zampini if (!sub_schurs || !sub_schurs->reuse_solver) { 48226816873aSStefano Zampini IS is_aux1,is_aux2; 48236816873aSStefano Zampini PetscInt *aux_array1,*aux_array2,*is_indices,*idx_R_local; 48246816873aSStefano Zampini 48253a50541eSStefano Zampini ierr = ISGetIndices(pcbddc->is_R_local,(const PetscInt**)&idx_R_local);CHKERRQ(ierr); 4826854ce69bSBarry Smith ierr = PetscMalloc1(pcis->n_B-n_vertices,&aux_array1);CHKERRQ(ierr); 4827854ce69bSBarry Smith ierr = PetscMalloc1(pcis->n_B-n_vertices,&aux_array2);CHKERRQ(ierr); 4828a64d13efSStefano Zampini ierr = ISGetIndices(pcis->is_I_local,(const PetscInt**)&is_indices);CHKERRQ(ierr); 48294641a718SStefano Zampini for (i=0; i<n_D; i++) { 48304641a718SStefano Zampini ierr = PetscBTSet(bitmask,is_indices[i]);CHKERRQ(ierr); 48314641a718SStefano Zampini } 4832a64d13efSStefano Zampini ierr = ISRestoreIndices(pcis->is_I_local,(const PetscInt**)&is_indices);CHKERRQ(ierr); 4833a64d13efSStefano Zampini for (i=0, j=0; i<n_R; i++) { 48344641a718SStefano Zampini if 
(!PetscBTLookup(bitmask,idx_R_local[i])) { 48354641a718SStefano Zampini aux_array1[j++] = i; 4836a64d13efSStefano Zampini } 4837a64d13efSStefano Zampini } 4838a64d13efSStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,j,aux_array1,PETSC_OWN_POINTER,&is_aux1);CHKERRQ(ierr); 4839a64d13efSStefano Zampini ierr = ISGetIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr); 4840a64d13efSStefano Zampini for (i=0, j=0; i<n_B; i++) { 48414641a718SStefano Zampini if (!PetscBTLookup(bitmask,is_indices[i])) { 48424641a718SStefano Zampini aux_array2[j++] = i; 4843a64d13efSStefano Zampini } 4844a64d13efSStefano Zampini } 4845a64d13efSStefano Zampini ierr = ISRestoreIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr); 4846a64d13efSStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,j,aux_array2,PETSC_OWN_POINTER,&is_aux2);CHKERRQ(ierr); 4847a64d13efSStefano Zampini ierr = VecScatterCreate(pcbddc->vec1_R,is_aux1,pcis->vec1_B,is_aux2,&pcbddc->R_to_B);CHKERRQ(ierr); 4848a64d13efSStefano Zampini ierr = ISDestroy(&is_aux1);CHKERRQ(ierr); 4849a64d13efSStefano Zampini ierr = ISDestroy(&is_aux2);CHKERRQ(ierr); 4850a64d13efSStefano Zampini 48518eeda7d8SStefano Zampini if (pcbddc->switch_static || pcbddc->dbg_flag) { 4852785e854fSJed Brown ierr = PetscMalloc1(n_D,&aux_array1);CHKERRQ(ierr); 4853a64d13efSStefano Zampini for (i=0, j=0; i<n_R; i++) { 48544641a718SStefano Zampini if (PetscBTLookup(bitmask,idx_R_local[i])) { 48554641a718SStefano Zampini aux_array1[j++] = i; 4856a64d13efSStefano Zampini } 4857a64d13efSStefano Zampini } 4858a64d13efSStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,j,aux_array1,PETSC_OWN_POINTER,&is_aux1);CHKERRQ(ierr); 4859a64d13efSStefano Zampini ierr = VecScatterCreate(pcbddc->vec1_R,is_aux1,pcis->vec1_D,(IS)0,&pcbddc->R_to_D);CHKERRQ(ierr); 4860a64d13efSStefano Zampini ierr = ISDestroy(&is_aux1);CHKERRQ(ierr); 4861a64d13efSStefano Zampini } 48624641a718SStefano Zampini ierr = 
PetscBTDestroy(&bitmask);CHKERRQ(ierr); 48633a50541eSStefano Zampini ierr = ISRestoreIndices(pcbddc->is_R_local,(const PetscInt**)&idx_R_local);CHKERRQ(ierr); 4864d62866d3SStefano Zampini } else { 4865df4d28bfSStefano Zampini PCBDDCReuseSolvers reuse_solver = sub_schurs->reuse_solver; 48666816873aSStefano Zampini IS tis; 48676816873aSStefano Zampini PetscInt schur_size; 48686816873aSStefano Zampini 4869df4d28bfSStefano Zampini ierr = ISGetLocalSize(reuse_solver->is_B,&schur_size);CHKERRQ(ierr); 48706816873aSStefano Zampini ierr = ISCreateStride(PETSC_COMM_SELF,schur_size,n_D,1,&tis);CHKERRQ(ierr); 4871df4d28bfSStefano Zampini ierr = VecScatterCreate(pcbddc->vec1_R,tis,pcis->vec1_B,reuse_solver->is_B,&pcbddc->R_to_B);CHKERRQ(ierr); 48726816873aSStefano Zampini ierr = ISDestroy(&tis);CHKERRQ(ierr); 48736816873aSStefano Zampini if (pcbddc->switch_static || pcbddc->dbg_flag) { 48746816873aSStefano Zampini ierr = ISCreateStride(PETSC_COMM_SELF,n_D,0,1,&tis);CHKERRQ(ierr); 48756816873aSStefano Zampini ierr = VecScatterCreate(pcbddc->vec1_R,tis,pcis->vec1_D,(IS)0,&pcbddc->R_to_D);CHKERRQ(ierr); 48766816873aSStefano Zampini ierr = ISDestroy(&tis);CHKERRQ(ierr); 4877d62866d3SStefano Zampini } 4878d62866d3SStefano Zampini } 4879a64d13efSStefano Zampini PetscFunctionReturn(0); 4880a64d13efSStefano Zampini } 4881a64d13efSStefano Zampini 4882304d26faSStefano Zampini 4883684f6988SStefano Zampini PetscErrorCode PCBDDCSetUpLocalSolvers(PC pc, PetscBool dirichlet, PetscBool neumann) 4884304d26faSStefano Zampini { 4885304d26faSStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 4886304d26faSStefano Zampini PC_IS *pcis = (PC_IS*)pc->data; 4887304d26faSStefano Zampini PC pc_temp; 4888304d26faSStefano Zampini Mat A_RR; 4889f4ddd8eeSStefano Zampini MatReuse reuse; 4890304d26faSStefano Zampini PetscScalar m_one = -1.0; 4891304d26faSStefano Zampini PetscReal value; 489204708bb6SStefano Zampini PetscInt n_D,n_R; 4893c7017625SStefano Zampini PetscBool check_corr[2],issbaij; 
4894304d26faSStefano Zampini PetscErrorCode ierr; 4895e604994aSStefano Zampini /* prefixes stuff */ 4896312be037SStefano Zampini char dir_prefix[256],neu_prefix[256],str_level[16]; 4897e604994aSStefano Zampini size_t len; 4898304d26faSStefano Zampini 4899304d26faSStefano Zampini PetscFunctionBegin; 4900304d26faSStefano Zampini 4901e604994aSStefano Zampini /* compute prefixes */ 4902e604994aSStefano Zampini ierr = PetscStrcpy(dir_prefix,"");CHKERRQ(ierr); 4903e604994aSStefano Zampini ierr = PetscStrcpy(neu_prefix,"");CHKERRQ(ierr); 4904e604994aSStefano Zampini if (!pcbddc->current_level) { 4905e604994aSStefano Zampini ierr = PetscStrcpy(dir_prefix,((PetscObject)pc)->prefix);CHKERRQ(ierr); 4906e604994aSStefano Zampini ierr = PetscStrcpy(neu_prefix,((PetscObject)pc)->prefix);CHKERRQ(ierr); 4907e604994aSStefano Zampini ierr = PetscStrcat(dir_prefix,"pc_bddc_dirichlet_");CHKERRQ(ierr); 4908e604994aSStefano Zampini ierr = PetscStrcat(neu_prefix,"pc_bddc_neumann_");CHKERRQ(ierr); 4909e604994aSStefano Zampini } else { 4910e604994aSStefano Zampini ierr = PetscStrcpy(str_level,"");CHKERRQ(ierr); 4911312be037SStefano Zampini sprintf(str_level,"l%d_",(int)(pcbddc->current_level)); 4912e604994aSStefano Zampini ierr = PetscStrlen(((PetscObject)pc)->prefix,&len);CHKERRQ(ierr); 4913e604994aSStefano Zampini len -= 15; /* remove "pc_bddc_coarse_" */ 4914312be037SStefano Zampini if (pcbddc->current_level>1) len -= 3; /* remove "lX_" with X level number */ 4915312be037SStefano Zampini if (pcbddc->current_level>10) len -= 1; /* remove another char from level number */ 491634d6797cSStefano Zampini ierr = PetscStrncpy(dir_prefix,((PetscObject)pc)->prefix,len+1);CHKERRQ(ierr); 491734d6797cSStefano Zampini ierr = PetscStrncpy(neu_prefix,((PetscObject)pc)->prefix,len+1);CHKERRQ(ierr); 4918e604994aSStefano Zampini ierr = PetscStrcat(dir_prefix,"pc_bddc_dirichlet_");CHKERRQ(ierr); 4919e604994aSStefano Zampini ierr = PetscStrcat(neu_prefix,"pc_bddc_neumann_");CHKERRQ(ierr); 
4920e604994aSStefano Zampini ierr = PetscStrcat(dir_prefix,str_level);CHKERRQ(ierr); 4921e604994aSStefano Zampini ierr = PetscStrcat(neu_prefix,str_level);CHKERRQ(ierr); 4922e604994aSStefano Zampini } 4923e604994aSStefano Zampini 4924304d26faSStefano Zampini /* DIRICHLET PROBLEM */ 4925684f6988SStefano Zampini if (dirichlet) { 4926d5574798SStefano Zampini PCBDDCSubSchurs sub_schurs = pcbddc->sub_schurs; 4927450f8f5eSStefano Zampini if (pcbddc->benign_n && !pcbddc->benign_change_explicit) { 49289a962809SStefano Zampini if (!sub_schurs || !sub_schurs->reuse_solver) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"Not yet implemented\n"); 4929450f8f5eSStefano Zampini if (pcbddc->dbg_flag) { 4930a3df083aSStefano Zampini Mat A_IIn; 4931a3df083aSStefano Zampini 4932a3df083aSStefano Zampini ierr = PCBDDCBenignProject(pc,pcis->is_I_local,pcis->is_I_local,&A_IIn);CHKERRQ(ierr); 4933a3df083aSStefano Zampini ierr = MatDestroy(&pcis->A_II);CHKERRQ(ierr); 4934a3df083aSStefano Zampini pcis->A_II = A_IIn; 4935a3df083aSStefano Zampini } 4936450f8f5eSStefano Zampini } 49373301b35fSStefano Zampini if (pcbddc->local_mat->symmetric_set) { 49383301b35fSStefano Zampini ierr = MatSetOption(pcis->A_II,MAT_SYMMETRIC,pcbddc->local_mat->symmetric_set);CHKERRQ(ierr); 4939964fefecSStefano Zampini } 4940ac78edfcSStefano Zampini /* Matrix for Dirichlet problem is pcis->A_II */ 4941964fefecSStefano Zampini n_D = pcis->n - pcis->n_B; 4942304d26faSStefano Zampini if (!pcbddc->ksp_D) { /* create object if not yet build */ 4943304d26faSStefano Zampini ierr = KSPCreate(PETSC_COMM_SELF,&pcbddc->ksp_D);CHKERRQ(ierr); 4944304d26faSStefano Zampini ierr = PetscObjectIncrementTabLevel((PetscObject)pcbddc->ksp_D,(PetscObject)pc,1);CHKERRQ(ierr); 4945304d26faSStefano Zampini /* default */ 4946304d26faSStefano Zampini ierr = KSPSetType(pcbddc->ksp_D,KSPPREONLY);CHKERRQ(ierr); 4947e604994aSStefano Zampini ierr = KSPSetOptionsPrefix(pcbddc->ksp_D,dir_prefix);CHKERRQ(ierr); 49489577ea80SStefano Zampini ierr = 
PetscObjectTypeCompare((PetscObject)pcis->A_II,MATSEQSBAIJ,&issbaij);CHKERRQ(ierr); 4949304d26faSStefano Zampini ierr = KSPGetPC(pcbddc->ksp_D,&pc_temp);CHKERRQ(ierr); 49509577ea80SStefano Zampini if (issbaij) { 49519577ea80SStefano Zampini ierr = PCSetType(pc_temp,PCCHOLESKY);CHKERRQ(ierr); 49529577ea80SStefano Zampini } else { 4953304d26faSStefano Zampini ierr = PCSetType(pc_temp,PCLU);CHKERRQ(ierr); 49549577ea80SStefano Zampini } 4955304d26faSStefano Zampini /* Allow user's customization */ 4956304d26faSStefano Zampini ierr = KSPSetFromOptions(pcbddc->ksp_D);CHKERRQ(ierr); 4957304d26faSStefano Zampini ierr = PCFactorSetReuseFill(pc_temp,PETSC_TRUE);CHKERRQ(ierr); 4958304d26faSStefano Zampini } 4959d1e9a80fSBarry Smith ierr = KSPSetOperators(pcbddc->ksp_D,pcis->A_II,pcis->A_II);CHKERRQ(ierr); 4960b334f244SStefano Zampini if (sub_schurs && sub_schurs->reuse_solver) { 4961df4d28bfSStefano Zampini PCBDDCReuseSolvers reuse_solver = sub_schurs->reuse_solver; 4962d62866d3SStefano Zampini 4963df4d28bfSStefano Zampini ierr = KSPSetPC(pcbddc->ksp_D,reuse_solver->interior_solver);CHKERRQ(ierr); 4964d5574798SStefano Zampini } 4965304d26faSStefano Zampini /* umfpack interface has a bug when matrix dimension is zero. 
TODO solve from umfpack interface */ 4966304d26faSStefano Zampini if (!n_D) { 4967304d26faSStefano Zampini ierr = KSPGetPC(pcbddc->ksp_D,&pc_temp);CHKERRQ(ierr); 4968304d26faSStefano Zampini ierr = PCSetType(pc_temp,PCNONE);CHKERRQ(ierr); 4969304d26faSStefano Zampini } 4970304d26faSStefano Zampini /* Set Up KSP for Dirichlet problem of BDDC */ 4971304d26faSStefano Zampini ierr = KSPSetUp(pcbddc->ksp_D);CHKERRQ(ierr); 4972304d26faSStefano Zampini /* set ksp_D into pcis data */ 4973304d26faSStefano Zampini ierr = KSPDestroy(&pcis->ksp_D);CHKERRQ(ierr); 4974304d26faSStefano Zampini ierr = PetscObjectReference((PetscObject)pcbddc->ksp_D);CHKERRQ(ierr); 4975304d26faSStefano Zampini pcis->ksp_D = pcbddc->ksp_D; 4976684f6988SStefano Zampini } 4977304d26faSStefano Zampini 4978304d26faSStefano Zampini /* NEUMANN PROBLEM */ 4979684f6988SStefano Zampini A_RR = 0; 4980684f6988SStefano Zampini if (neumann) { 4981d62866d3SStefano Zampini PCBDDCSubSchurs sub_schurs = pcbddc->sub_schurs; 498204708bb6SStefano Zampini PetscInt ibs,mbs; 49830aa714b2SStefano Zampini PetscBool issbaij, reuse_neumann_solver; 498404708bb6SStefano Zampini Mat_IS* matis = (Mat_IS*)pc->pmat->data; 49850aa714b2SStefano Zampini 49860aa714b2SStefano Zampini reuse_neumann_solver = PETSC_FALSE; 49870aa714b2SStefano Zampini if (sub_schurs && sub_schurs->reuse_solver) { 49880aa714b2SStefano Zampini IS iP; 49890aa714b2SStefano Zampini 49900aa714b2SStefano Zampini reuse_neumann_solver = PETSC_TRUE; 49910aa714b2SStefano Zampini ierr = PetscObjectQuery((PetscObject)sub_schurs->A,"__KSPFETIDP_iP",(PetscObject*)&iP);CHKERRQ(ierr); 49920aa714b2SStefano Zampini if (iP) reuse_neumann_solver = PETSC_FALSE; 49930aa714b2SStefano Zampini } 4994f4ddd8eeSStefano Zampini /* Matrix for Neumann problem is A_RR -> we need to create/reuse it at this point */ 49958ce42a96SStefano Zampini ierr = ISGetSize(pcbddc->is_R_local,&n_R);CHKERRQ(ierr); 4996f4ddd8eeSStefano Zampini if (pcbddc->ksp_R) { /* already created ksp */ 
4997f4ddd8eeSStefano Zampini PetscInt nn_R; 499881d9aea3SBarry Smith ierr = KSPGetOperators(pcbddc->ksp_R,NULL,&A_RR);CHKERRQ(ierr); 4999f4ddd8eeSStefano Zampini ierr = PetscObjectReference((PetscObject)A_RR);CHKERRQ(ierr); 5000f4ddd8eeSStefano Zampini ierr = MatGetSize(A_RR,&nn_R,NULL);CHKERRQ(ierr); 5001f4ddd8eeSStefano Zampini if (nn_R != n_R) { /* old ksp is not reusable, so reset it */ 5002f4ddd8eeSStefano Zampini ierr = KSPReset(pcbddc->ksp_R);CHKERRQ(ierr); 5003f4ddd8eeSStefano Zampini ierr = MatDestroy(&A_RR);CHKERRQ(ierr); 5004f4ddd8eeSStefano Zampini reuse = MAT_INITIAL_MATRIX; 5005f4ddd8eeSStefano Zampini } else { /* same sizes, but nonzero pattern depend on primal vertices so it can be changed */ 5006727cdba6SStefano Zampini if (pcbddc->new_primal_space_local) { /* we are not sure the matrix will have the same nonzero pattern */ 5007f4ddd8eeSStefano Zampini ierr = MatDestroy(&A_RR);CHKERRQ(ierr); 5008f4ddd8eeSStefano Zampini reuse = MAT_INITIAL_MATRIX; 5009f4ddd8eeSStefano Zampini } else { /* safe to reuse the matrix */ 5010f4ddd8eeSStefano Zampini reuse = MAT_REUSE_MATRIX; 5011f4ddd8eeSStefano Zampini } 5012f4ddd8eeSStefano Zampini } 5013f4ddd8eeSStefano Zampini /* last check */ 5014d1e9a80fSBarry Smith if (pc->flag == DIFFERENT_NONZERO_PATTERN) { 5015f4ddd8eeSStefano Zampini ierr = MatDestroy(&A_RR);CHKERRQ(ierr); 5016f4ddd8eeSStefano Zampini reuse = MAT_INITIAL_MATRIX; 5017f4ddd8eeSStefano Zampini } 5018f4ddd8eeSStefano Zampini } else { /* first time, so we need to create the matrix */ 5019f4ddd8eeSStefano Zampini reuse = MAT_INITIAL_MATRIX; 5020f4ddd8eeSStefano Zampini } 5021a00504b5SStefano Zampini /* convert pcbddc->local_mat if needed later in PCBDDCSetUpCorrection */ 5022af732b37SStefano Zampini ierr = MatGetBlockSize(pcbddc->local_mat,&mbs);CHKERRQ(ierr); 5023af732b37SStefano Zampini ierr = ISGetBlockSize(pcbddc->is_R_local,&ibs);CHKERRQ(ierr); 502404708bb6SStefano Zampini ierr = 
PetscObjectTypeCompare((PetscObject)pcbddc->local_mat,MATSEQSBAIJ,&issbaij);CHKERRQ(ierr); 502504708bb6SStefano Zampini if (ibs != mbs) { /* need to convert to SEQAIJ to extract any submatrix with is_R_local */ 502604708bb6SStefano Zampini if (matis->A == pcbddc->local_mat) { 502704708bb6SStefano Zampini ierr = MatDestroy(&pcbddc->local_mat);CHKERRQ(ierr); 502804708bb6SStefano Zampini ierr = MatConvert(matis->A,MATSEQAIJ,MAT_INITIAL_MATRIX,&pcbddc->local_mat);CHKERRQ(ierr); 5029af732b37SStefano Zampini } else { 5030511c6705SHong Zhang ierr = MatConvert(pcbddc->local_mat,MATSEQAIJ,MAT_INPLACE_MATRIX,&pcbddc->local_mat);CHKERRQ(ierr); 50316816873aSStefano Zampini } 503204708bb6SStefano Zampini } else if (issbaij) { /* need to convert to BAIJ to get offdiagonal blocks */ 503304708bb6SStefano Zampini if (matis->A == pcbddc->local_mat) { 503404708bb6SStefano Zampini ierr = MatDestroy(&pcbddc->local_mat);CHKERRQ(ierr); 503504708bb6SStefano Zampini ierr = MatConvert(matis->A,MATSEQBAIJ,MAT_INITIAL_MATRIX,&pcbddc->local_mat);CHKERRQ(ierr); 503604708bb6SStefano Zampini } else { 5037511c6705SHong Zhang ierr = MatConvert(pcbddc->local_mat,MATSEQBAIJ,MAT_INPLACE_MATRIX,&pcbddc->local_mat);CHKERRQ(ierr); 503804708bb6SStefano Zampini } 503904708bb6SStefano Zampini } 5040a00504b5SStefano Zampini /* extract A_RR */ 50410aa714b2SStefano Zampini if (reuse_neumann_solver) { 5042a00504b5SStefano Zampini PCBDDCReuseSolvers reuse_solver = sub_schurs->reuse_solver; 5043a00504b5SStefano Zampini 5044a00504b5SStefano Zampini if (pcbddc->dbg_flag) { /* we need A_RR to test the solver later */ 504516e386b8SStefano Zampini ierr = MatDestroy(&A_RR);CHKERRQ(ierr); 5046a00504b5SStefano Zampini if (reuse_solver->benign_n) { /* we are not using the explicit change of basis on the pressures */ 504716e386b8SStefano Zampini ierr = PCBDDCBenignProject(pc,pcbddc->is_R_local,pcbddc->is_R_local,&A_RR);CHKERRQ(ierr); 504816e386b8SStefano Zampini } else { 50497dae84e0SHong Zhang ierr = 
MatCreateSubMatrix(pcbddc->local_mat,pcbddc->is_R_local,pcbddc->is_R_local,MAT_INITIAL_MATRIX,&A_RR);CHKERRQ(ierr); 5050a00504b5SStefano Zampini } 5051a00504b5SStefano Zampini } else { 5052a00504b5SStefano Zampini ierr = MatDestroy(&A_RR);CHKERRQ(ierr); 5053a00504b5SStefano Zampini ierr = PCGetOperators(reuse_solver->correction_solver,&A_RR,NULL);CHKERRQ(ierr); 5054a00504b5SStefano Zampini ierr = PetscObjectReference((PetscObject)A_RR);CHKERRQ(ierr); 5055a00504b5SStefano Zampini } 5056a00504b5SStefano Zampini } else { /* we have to build the neumann solver, so we need to extract the relevant matrix */ 50577dae84e0SHong Zhang ierr = MatCreateSubMatrix(pcbddc->local_mat,pcbddc->is_R_local,pcbddc->is_R_local,reuse,&A_RR);CHKERRQ(ierr); 505816e386b8SStefano Zampini } 50593301b35fSStefano Zampini if (pcbddc->local_mat->symmetric_set) { 50603301b35fSStefano Zampini ierr = MatSetOption(A_RR,MAT_SYMMETRIC,pcbddc->local_mat->symmetric_set);CHKERRQ(ierr); 50616816873aSStefano Zampini } 5062f4ddd8eeSStefano Zampini if (!pcbddc->ksp_R) { /* create object if not present */ 5063304d26faSStefano Zampini ierr = KSPCreate(PETSC_COMM_SELF,&pcbddc->ksp_R);CHKERRQ(ierr); 5064304d26faSStefano Zampini ierr = PetscObjectIncrementTabLevel((PetscObject)pcbddc->ksp_R,(PetscObject)pc,1);CHKERRQ(ierr); 5065304d26faSStefano Zampini /* default */ 5066304d26faSStefano Zampini ierr = KSPSetType(pcbddc->ksp_R,KSPPREONLY);CHKERRQ(ierr); 5067e604994aSStefano Zampini ierr = KSPSetOptionsPrefix(pcbddc->ksp_R,neu_prefix);CHKERRQ(ierr); 5068304d26faSStefano Zampini ierr = KSPGetPC(pcbddc->ksp_R,&pc_temp);CHKERRQ(ierr); 50699577ea80SStefano Zampini ierr = PetscObjectTypeCompare((PetscObject)A_RR,MATSEQSBAIJ,&issbaij);CHKERRQ(ierr); 50709577ea80SStefano Zampini if (issbaij) { 50719577ea80SStefano Zampini ierr = PCSetType(pc_temp,PCCHOLESKY);CHKERRQ(ierr); 50729577ea80SStefano Zampini } else { 5073304d26faSStefano Zampini ierr = PCSetType(pc_temp,PCLU);CHKERRQ(ierr); 50749577ea80SStefano Zampini } 
5075304d26faSStefano Zampini /* Allow user's customization */ 5076304d26faSStefano Zampini ierr = KSPSetFromOptions(pcbddc->ksp_R);CHKERRQ(ierr); 5077304d26faSStefano Zampini ierr = PCFactorSetReuseFill(pc_temp,PETSC_TRUE);CHKERRQ(ierr); 5078304d26faSStefano Zampini } 5079304d26faSStefano Zampini /* umfpack interface has a bug when matrix dimension is zero. TODO solve from umfpack interface */ 5080304d26faSStefano Zampini if (!n_R) { 5081304d26faSStefano Zampini ierr = KSPGetPC(pcbddc->ksp_R,&pc_temp);CHKERRQ(ierr); 5082304d26faSStefano Zampini ierr = PCSetType(pc_temp,PCNONE);CHKERRQ(ierr); 5083304d26faSStefano Zampini } 50845cbda25cSStefano Zampini ierr = KSPSetOperators(pcbddc->ksp_R,A_RR,A_RR);CHKERRQ(ierr); 5085df4d28bfSStefano Zampini /* Reuse solver if it is present */ 50860aa714b2SStefano Zampini if (reuse_neumann_solver) { 5087df4d28bfSStefano Zampini PCBDDCReuseSolvers reuse_solver = sub_schurs->reuse_solver; 5088d62866d3SStefano Zampini 5089df4d28bfSStefano Zampini ierr = KSPSetPC(pcbddc->ksp_R,reuse_solver->correction_solver);CHKERRQ(ierr); 5090d62866d3SStefano Zampini } 5091304d26faSStefano Zampini /* Set Up KSP for Neumann problem of BDDC */ 5092304d26faSStefano Zampini ierr = KSPSetUp(pcbddc->ksp_R);CHKERRQ(ierr); 5093684f6988SStefano Zampini } 5094304d26faSStefano Zampini 5095684f6988SStefano Zampini if (pcbddc->dbg_flag) { 5096684f6988SStefano Zampini ierr = PetscViewerFlush(pcbddc->dbg_viewer);CHKERRQ(ierr); 50971575c14dSBarry Smith ierr = PetscViewerASCIIPushSynchronized(pcbddc->dbg_viewer);CHKERRQ(ierr); 5098684f6988SStefano Zampini ierr = PetscViewerASCIIPrintf(pcbddc->dbg_viewer,"--------------------------------------------------\n");CHKERRQ(ierr); 5099684f6988SStefano Zampini } 5100c7017625SStefano Zampini 5101c7017625SStefano Zampini /* adapt Dirichlet and Neumann solvers if a nullspace correction has been requested */ 5102c7017625SStefano Zampini check_corr[0] = check_corr[1] = PETSC_FALSE; 5103c7017625SStefano Zampini if 
(pcbddc->NullSpace_corr[0]) { 5104c7017625SStefano Zampini ierr = PCBDDCSetUseExactDirichlet(pc,PETSC_FALSE);CHKERRQ(ierr); 5105c7017625SStefano Zampini } 5106c7017625SStefano Zampini if (dirichlet && pcbddc->NullSpace_corr[0] && !pcbddc->switch_static) { 5107c7017625SStefano Zampini check_corr[0] = PETSC_TRUE; 5108c7017625SStefano Zampini ierr = PCBDDCNullSpaceAssembleCorrection(pc,PETSC_TRUE,pcbddc->NullSpace_corr[1]);CHKERRQ(ierr); 5109c7017625SStefano Zampini } 5110c7017625SStefano Zampini if (neumann && pcbddc->NullSpace_corr[2]) { 5111c7017625SStefano Zampini check_corr[1] = PETSC_TRUE; 5112c7017625SStefano Zampini ierr = PCBDDCNullSpaceAssembleCorrection(pc,PETSC_FALSE,pcbddc->NullSpace_corr[3]);CHKERRQ(ierr); 5113c7017625SStefano Zampini } 5114c7017625SStefano Zampini 5115c7017625SStefano Zampini /* check Dirichlet and Neumann solvers */ 5116c7017625SStefano Zampini if (pcbddc->dbg_flag) { 5117684f6988SStefano Zampini if (dirichlet) { /* Dirichlet */ 51180fccc4e9SStefano Zampini ierr = VecSetRandom(pcis->vec1_D,NULL);CHKERRQ(ierr); 51190fccc4e9SStefano Zampini ierr = MatMult(pcis->A_II,pcis->vec1_D,pcis->vec2_D);CHKERRQ(ierr); 51200fccc4e9SStefano Zampini ierr = KSPSolve(pcbddc->ksp_D,pcis->vec2_D,pcis->vec2_D);CHKERRQ(ierr); 51210fccc4e9SStefano Zampini ierr = VecAXPY(pcis->vec1_D,m_one,pcis->vec2_D);CHKERRQ(ierr); 51220fccc4e9SStefano Zampini ierr = VecNorm(pcis->vec1_D,NORM_INFINITY,&value);CHKERRQ(ierr); 5123e604994aSStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"Subdomain %04d infinity error for Dirichlet solve (%s) = % 1.14e \n",PetscGlobalRank,((PetscObject)(pcbddc->ksp_D))->prefix,value);CHKERRQ(ierr); 5124c7017625SStefano Zampini if (check_corr[0]) { 5125c7017625SStefano Zampini ierr = PCBDDCNullSpaceCheckCorrection(pc,PETSC_TRUE);CHKERRQ(ierr); 5126c7017625SStefano Zampini } 5127304d26faSStefano Zampini ierr = PetscViewerFlush(pcbddc->dbg_viewer);CHKERRQ(ierr); 5128304d26faSStefano Zampini } 5129684f6988SStefano 
Zampini if (neumann) { /* Neumann */ 51300fccc4e9SStefano Zampini ierr = VecSetRandom(pcbddc->vec1_R,NULL);CHKERRQ(ierr); 51310fccc4e9SStefano Zampini ierr = MatMult(A_RR,pcbddc->vec1_R,pcbddc->vec2_R);CHKERRQ(ierr); 51320fccc4e9SStefano Zampini ierr = KSPSolve(pcbddc->ksp_R,pcbddc->vec2_R,pcbddc->vec2_R);CHKERRQ(ierr); 51330fccc4e9SStefano Zampini ierr = VecAXPY(pcbddc->vec1_R,m_one,pcbddc->vec2_R);CHKERRQ(ierr); 51340fccc4e9SStefano Zampini ierr = VecNorm(pcbddc->vec1_R,NORM_INFINITY,&value);CHKERRQ(ierr); 5135e604994aSStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"Subdomain %04d infinity error for Neumann solve (%s) = % 1.14e\n",PetscGlobalRank,((PetscObject)(pcbddc->ksp_R))->prefix,value);CHKERRQ(ierr); 5136c7017625SStefano Zampini if (check_corr[1]) { 5137c7017625SStefano Zampini ierr = PCBDDCNullSpaceCheckCorrection(pc,PETSC_FALSE);CHKERRQ(ierr); 5138c7017625SStefano Zampini } 5139304d26faSStefano Zampini ierr = PetscViewerFlush(pcbddc->dbg_viewer);CHKERRQ(ierr); 5140304d26faSStefano Zampini } 5141684f6988SStefano Zampini } 51425cbda25cSStefano Zampini /* free Neumann problem's matrix */ 51435cbda25cSStefano Zampini ierr = MatDestroy(&A_RR);CHKERRQ(ierr); 5144304d26faSStefano Zampini PetscFunctionReturn(0); 5145304d26faSStefano Zampini } 5146304d26faSStefano Zampini 514780677318SStefano Zampini static PetscErrorCode PCBDDCSolveSubstructureCorrection(PC pc, Vec inout_B, Vec inout_D, PetscBool applytranspose) 5148674ae819SStefano Zampini { 5149674ae819SStefano Zampini PetscErrorCode ierr; 5150674ae819SStefano Zampini PC_BDDC* pcbddc = (PC_BDDC*)(pc->data); 5151be83ff47SStefano Zampini PCBDDCSubSchurs sub_schurs = pcbddc->sub_schurs; 5152b334f244SStefano Zampini PetscBool reuse_solver = sub_schurs ? ( sub_schurs->reuse_solver ? 
PETSC_TRUE : PETSC_FALSE ) : PETSC_FALSE; 5153674ae819SStefano Zampini 5154674ae819SStefano Zampini PetscFunctionBegin; 5155b334f244SStefano Zampini if (!reuse_solver) { 515680677318SStefano Zampini ierr = VecSet(pcbddc->vec1_R,0.);CHKERRQ(ierr); 515720c7b377SStefano Zampini } 515880677318SStefano Zampini if (!pcbddc->switch_static) { 515980677318SStefano Zampini if (applytranspose && pcbddc->local_auxmat1) { 516080677318SStefano Zampini ierr = MatMultTranspose(pcbddc->local_auxmat2,inout_B,pcbddc->vec1_C);CHKERRQ(ierr); 516180677318SStefano Zampini ierr = MatMultTransposeAdd(pcbddc->local_auxmat1,pcbddc->vec1_C,inout_B,inout_B);CHKERRQ(ierr); 516220c7b377SStefano Zampini } 5163b334f244SStefano Zampini if (!reuse_solver) { 516480677318SStefano Zampini ierr = VecScatterBegin(pcbddc->R_to_B,inout_B,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 516580677318SStefano Zampini ierr = VecScatterEnd(pcbddc->R_to_B,inout_B,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 516620c7b377SStefano Zampini } else { 5167df4d28bfSStefano Zampini PCBDDCReuseSolvers reuse_solver = sub_schurs->reuse_solver; 5168be83ff47SStefano Zampini 5169df4d28bfSStefano Zampini ierr = VecScatterBegin(reuse_solver->correction_scatter_B,inout_B,reuse_solver->rhs_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 5170df4d28bfSStefano Zampini ierr = VecScatterEnd(reuse_solver->correction_scatter_B,inout_B,reuse_solver->rhs_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 517120c7b377SStefano Zampini } 5172be83ff47SStefano Zampini } else { 517380677318SStefano Zampini ierr = VecScatterBegin(pcbddc->R_to_B,inout_B,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 517480677318SStefano Zampini ierr = VecScatterEnd(pcbddc->R_to_B,inout_B,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 517580677318SStefano Zampini ierr = VecScatterBegin(pcbddc->R_to_D,inout_D,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 517680677318SStefano Zampini ierr = 
VecScatterEnd(pcbddc->R_to_D,inout_D,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 517780677318SStefano Zampini if (applytranspose && pcbddc->local_auxmat1) { 517880677318SStefano Zampini ierr = MatMultTranspose(pcbddc->local_auxmat2,pcbddc->vec1_R,pcbddc->vec1_C);CHKERRQ(ierr); 517980677318SStefano Zampini ierr = MatMultTransposeAdd(pcbddc->local_auxmat1,pcbddc->vec1_C,inout_B,inout_B);CHKERRQ(ierr); 518080677318SStefano Zampini ierr = VecScatterBegin(pcbddc->R_to_B,inout_B,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 518180677318SStefano Zampini ierr = VecScatterEnd(pcbddc->R_to_B,inout_B,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 5182674ae819SStefano Zampini } 5183674ae819SStefano Zampini } 5184b334f244SStefano Zampini if (!reuse_solver || pcbddc->switch_static) { 518580677318SStefano Zampini if (applytranspose) { 518680677318SStefano Zampini ierr = KSPSolveTranspose(pcbddc->ksp_R,pcbddc->vec1_R,pcbddc->vec1_R);CHKERRQ(ierr); 518780677318SStefano Zampini } else { 518880677318SStefano Zampini ierr = KSPSolve(pcbddc->ksp_R,pcbddc->vec1_R,pcbddc->vec1_R);CHKERRQ(ierr); 518980677318SStefano Zampini } 5190be83ff47SStefano Zampini } else { 5191df4d28bfSStefano Zampini PCBDDCReuseSolvers reuse_solver = sub_schurs->reuse_solver; 5192be83ff47SStefano Zampini 5193be83ff47SStefano Zampini if (applytranspose) { 5194df4d28bfSStefano Zampini ierr = MatFactorSolveSchurComplementTranspose(reuse_solver->F,reuse_solver->rhs_B,reuse_solver->sol_B);CHKERRQ(ierr); 5195be83ff47SStefano Zampini } else { 5196df4d28bfSStefano Zampini ierr = MatFactorSolveSchurComplement(reuse_solver->F,reuse_solver->rhs_B,reuse_solver->sol_B);CHKERRQ(ierr); 5197be83ff47SStefano Zampini } 5198be83ff47SStefano Zampini } 519980677318SStefano Zampini ierr = VecSet(inout_B,0.);CHKERRQ(ierr); 520080677318SStefano Zampini if (!pcbddc->switch_static) { 5201b334f244SStefano Zampini if (!reuse_solver) { 520280677318SStefano Zampini ierr = 
VecScatterBegin(pcbddc->R_to_B,pcbddc->vec1_R,inout_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 520380677318SStefano Zampini ierr = VecScatterEnd(pcbddc->R_to_B,pcbddc->vec1_R,inout_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 5204be83ff47SStefano Zampini } else { 5205df4d28bfSStefano Zampini PCBDDCReuseSolvers reuse_solver = sub_schurs->reuse_solver; 5206be83ff47SStefano Zampini 5207df4d28bfSStefano Zampini ierr = VecScatterBegin(reuse_solver->correction_scatter_B,reuse_solver->sol_B,inout_B,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 5208df4d28bfSStefano Zampini ierr = VecScatterEnd(reuse_solver->correction_scatter_B,reuse_solver->sol_B,inout_B,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 5209be83ff47SStefano Zampini } 521080677318SStefano Zampini if (!applytranspose && pcbddc->local_auxmat1) { 521180677318SStefano Zampini ierr = MatMult(pcbddc->local_auxmat1,inout_B,pcbddc->vec1_C);CHKERRQ(ierr); 521280677318SStefano Zampini ierr = MatMultAdd(pcbddc->local_auxmat2,pcbddc->vec1_C,inout_B,inout_B);CHKERRQ(ierr); 521380677318SStefano Zampini } 521480677318SStefano Zampini } else { 521580677318SStefano Zampini ierr = VecScatterBegin(pcbddc->R_to_B,pcbddc->vec1_R,inout_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 521680677318SStefano Zampini ierr = VecScatterEnd(pcbddc->R_to_B,pcbddc->vec1_R,inout_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 521780677318SStefano Zampini ierr = VecScatterBegin(pcbddc->R_to_D,pcbddc->vec1_R,inout_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 521880677318SStefano Zampini ierr = VecScatterEnd(pcbddc->R_to_D,pcbddc->vec1_R,inout_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 521980677318SStefano Zampini if (!applytranspose && pcbddc->local_auxmat1) { 522080677318SStefano Zampini ierr = MatMult(pcbddc->local_auxmat1,inout_B,pcbddc->vec1_C);CHKERRQ(ierr); 522180677318SStefano Zampini ierr = MatMultAdd(pcbddc->local_auxmat2,pcbddc->vec1_C,pcbddc->vec1_R,pcbddc->vec1_R);CHKERRQ(ierr); 522280677318SStefano Zampini } 
522380677318SStefano Zampini ierr = VecScatterBegin(pcbddc->R_to_B,pcbddc->vec1_R,inout_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 522480677318SStefano Zampini ierr = VecScatterEnd(pcbddc->R_to_B,pcbddc->vec1_R,inout_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 522580677318SStefano Zampini ierr = VecScatterBegin(pcbddc->R_to_D,pcbddc->vec1_R,inout_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 522680677318SStefano Zampini ierr = VecScatterEnd(pcbddc->R_to_D,pcbddc->vec1_R,inout_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 5227674ae819SStefano Zampini } 5228674ae819SStefano Zampini PetscFunctionReturn(0); 5229674ae819SStefano Zampini } 5230674ae819SStefano Zampini 5231dc359a40SStefano Zampini /* parameter apply transpose determines if the interface preconditioner should be applied transposed or not */ 5232dc359a40SStefano Zampini PetscErrorCode PCBDDCApplyInterfacePreconditioner(PC pc, PetscBool applytranspose) 5233674ae819SStefano Zampini { 5234674ae819SStefano Zampini PetscErrorCode ierr; 5235674ae819SStefano Zampini PC_BDDC* pcbddc = (PC_BDDC*)(pc->data); 5236674ae819SStefano Zampini PC_IS* pcis = (PC_IS*) (pc->data); 5237674ae819SStefano Zampini const PetscScalar zero = 0.0; 5238674ae819SStefano Zampini 5239674ae819SStefano Zampini PetscFunctionBegin; 5240dc359a40SStefano Zampini /* Application of PSI^T or PHI^T (depending on applytranspose, see comment above) */ 52414fee134fSStefano Zampini if (!pcbddc->benign_apply_coarse_only) { 5242dc359a40SStefano Zampini if (applytranspose) { 5243674ae819SStefano Zampini ierr = MatMultTranspose(pcbddc->coarse_phi_B,pcis->vec1_B,pcbddc->vec1_P);CHKERRQ(ierr); 52448eeda7d8SStefano Zampini if (pcbddc->switch_static) { ierr = MatMultTransposeAdd(pcbddc->coarse_phi_D,pcis->vec1_D,pcbddc->vec1_P,pcbddc->vec1_P);CHKERRQ(ierr); } 5245dc359a40SStefano Zampini } else { 5246674ae819SStefano Zampini ierr = MatMultTranspose(pcbddc->coarse_psi_B,pcis->vec1_B,pcbddc->vec1_P);CHKERRQ(ierr); 5247674ae819SStefano Zampini if 
(pcbddc->switch_static) { ierr = MatMultTransposeAdd(pcbddc->coarse_psi_D,pcis->vec1_D,pcbddc->vec1_P,pcbddc->vec1_P);CHKERRQ(ierr); } 524815aaf578SStefano Zampini } 52494fee134fSStefano Zampini } else { 52504fee134fSStefano Zampini ierr = VecSet(pcbddc->vec1_P,zero);CHKERRQ(ierr); 52514fee134fSStefano Zampini } 5252efc2fbd9SStefano Zampini 5253efc2fbd9SStefano Zampini /* add p0 to the last value of vec1_P holding the coarse dof relative to p0 */ 52544f1b2e48SStefano Zampini if (pcbddc->benign_n) { 5255efc2fbd9SStefano Zampini PetscScalar *array; 52564f1b2e48SStefano Zampini PetscInt j; 5257efc2fbd9SStefano Zampini 5258efc2fbd9SStefano Zampini ierr = VecGetArray(pcbddc->vec1_P,&array);CHKERRQ(ierr); 52594f1b2e48SStefano Zampini for (j=0;j<pcbddc->benign_n;j++) array[pcbddc->local_primal_size-pcbddc->benign_n+j] += pcbddc->benign_p0[j]; 5260efc2fbd9SStefano Zampini ierr = VecRestoreArray(pcbddc->vec1_P,&array);CHKERRQ(ierr); 5261efc2fbd9SStefano Zampini } 5262efc2fbd9SStefano Zampini 526312edc857SStefano Zampini /* start communications from local primal nodes to rhs of coarse solver */ 526412edc857SStefano Zampini ierr = VecSet(pcbddc->coarse_vec,zero);CHKERRQ(ierr); 526512edc857SStefano Zampini ierr = PCBDDCScatterCoarseDataBegin(pc,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 526612edc857SStefano Zampini ierr = PCBDDCScatterCoarseDataEnd(pc,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 526712edc857SStefano Zampini 52689f00e9b4SStefano Zampini /* Coarse solution -> rhs and sol updated inside PCBDDCScattarCoarseDataBegin/End */ 526912edc857SStefano Zampini if (pcbddc->coarse_ksp) { 527051694757SStefano Zampini Mat coarse_mat; 5271964fefecSStefano Zampini Vec rhs,sol; 527251694757SStefano Zampini MatNullSpace nullsp; 527327b6a85dSStefano Zampini PetscBool isbddc = PETSC_FALSE; 5274964fefecSStefano Zampini 527527b6a85dSStefano Zampini if (pcbddc->benign_have_null) { 527627b6a85dSStefano Zampini PC coarse_pc; 527727b6a85dSStefano Zampini 527827b6a85dSStefano Zampini ierr = 
KSPGetPC(pcbddc->coarse_ksp,&coarse_pc);CHKERRQ(ierr); 527927b6a85dSStefano Zampini ierr = PetscObjectTypeCompare((PetscObject)coarse_pc,PCBDDC,&isbddc);CHKERRQ(ierr); 528027b6a85dSStefano Zampini /* we need to propagate to coarser levels the need for a possible benign correction */ 528127b6a85dSStefano Zampini if (isbddc && pcbddc->benign_apply_coarse_only && !pcbddc->benign_skip_correction) { 528227b6a85dSStefano Zampini PC_BDDC* coarsepcbddc = (PC_BDDC*)(coarse_pc->data); 528327b6a85dSStefano Zampini coarsepcbddc->benign_skip_correction = PETSC_FALSE; 52843bca92a6SStefano Zampini coarsepcbddc->benign_apply_coarse_only = PETSC_TRUE; 528527b6a85dSStefano Zampini } 528627b6a85dSStefano Zampini } 5287964fefecSStefano Zampini ierr = KSPGetRhs(pcbddc->coarse_ksp,&rhs);CHKERRQ(ierr); 5288964fefecSStefano Zampini ierr = KSPGetSolution(pcbddc->coarse_ksp,&sol);CHKERRQ(ierr); 528951694757SStefano Zampini ierr = KSPGetOperators(pcbddc->coarse_ksp,&coarse_mat,NULL);CHKERRQ(ierr); 529051694757SStefano Zampini ierr = MatGetNullSpace(coarse_mat,&nullsp);CHKERRQ(ierr); 529151694757SStefano Zampini if (nullsp) { 529251694757SStefano Zampini ierr = MatNullSpaceRemove(nullsp,rhs);CHKERRQ(ierr); 529351694757SStefano Zampini } 529412edc857SStefano Zampini if (applytranspose) { 52959a962809SStefano Zampini if (pcbddc->benign_apply_coarse_only) SETERRQ(PetscObjectComm((PetscObject)pcbddc->coarse_ksp),PETSC_ERR_SUP,"Not yet implemented"); 5296964fefecSStefano Zampini ierr = KSPSolveTranspose(pcbddc->coarse_ksp,rhs,sol);CHKERRQ(ierr); 52972701bc32SStefano Zampini } else { 52981f4df5f7SStefano Zampini if (pcbddc->benign_apply_coarse_only && isbddc) { /* need just to apply the coarse preconditioner during presolve */ 52992701bc32SStefano Zampini PC coarse_pc; 53002701bc32SStefano Zampini 53012701bc32SStefano Zampini ierr = KSPGetPC(pcbddc->coarse_ksp,&coarse_pc);CHKERRQ(ierr); 53022701bc32SStefano Zampini ierr = PCPreSolve(coarse_pc,pcbddc->coarse_ksp);CHKERRQ(ierr); 53033e589ea0SStefano 
Zampini ierr = PCBDDCBenignRemoveInterior(coarse_pc,rhs,sol);CHKERRQ(ierr); 53042701bc32SStefano Zampini ierr = PCPostSolve(coarse_pc,pcbddc->coarse_ksp);CHKERRQ(ierr); 530512edc857SStefano Zampini } else { 5306964fefecSStefano Zampini ierr = KSPSolve(pcbddc->coarse_ksp,rhs,sol);CHKERRQ(ierr); 530712edc857SStefano Zampini } 53082701bc32SStefano Zampini } 53091d82a3b6SStefano Zampini /* we don't need the benign correction at coarser levels anymore */ 531027b6a85dSStefano Zampini if (pcbddc->benign_have_null && isbddc) { 531127b6a85dSStefano Zampini PC coarse_pc; 531227b6a85dSStefano Zampini PC_BDDC* coarsepcbddc; 531327b6a85dSStefano Zampini 531427b6a85dSStefano Zampini ierr = KSPGetPC(pcbddc->coarse_ksp,&coarse_pc);CHKERRQ(ierr); 531527b6a85dSStefano Zampini coarsepcbddc = (PC_BDDC*)(coarse_pc->data); 531627b6a85dSStefano Zampini coarsepcbddc->benign_skip_correction = PETSC_TRUE; 53173bca92a6SStefano Zampini coarsepcbddc->benign_apply_coarse_only = PETSC_FALSE; 531827b6a85dSStefano Zampini } 531951694757SStefano Zampini if (nullsp) { 532051694757SStefano Zampini ierr = MatNullSpaceRemove(nullsp,sol);CHKERRQ(ierr); 532151694757SStefano Zampini } 532212edc857SStefano Zampini } 5323674ae819SStefano Zampini 5324674ae819SStefano Zampini /* Local solution on R nodes */ 53254fee134fSStefano Zampini if (pcis->n && !pcbddc->benign_apply_coarse_only) { 532680677318SStefano Zampini ierr = PCBDDCSolveSubstructureCorrection(pc,pcis->vec1_B,pcis->vec1_D,applytranspose);CHKERRQ(ierr); 53279f00e9b4SStefano Zampini } 53289f00e9b4SStefano Zampini /* communications from coarse sol to local primal nodes */ 53299f00e9b4SStefano Zampini ierr = PCBDDCScatterCoarseDataBegin(pc,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 533012edc857SStefano Zampini ierr = PCBDDCScatterCoarseDataEnd(pc,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 5331674ae819SStefano Zampini 53324fee134fSStefano Zampini /* Sum contributions from the two levels */ 53334fee134fSStefano Zampini if 
(!pcbddc->benign_apply_coarse_only) { 5334dc359a40SStefano Zampini if (applytranspose) { 5335dc359a40SStefano Zampini ierr = MatMultAdd(pcbddc->coarse_psi_B,pcbddc->vec1_P,pcis->vec1_B,pcis->vec1_B);CHKERRQ(ierr); 5336dc359a40SStefano Zampini if (pcbddc->switch_static) { ierr = MatMultAdd(pcbddc->coarse_psi_D,pcbddc->vec1_P,pcis->vec1_D,pcis->vec1_D);CHKERRQ(ierr); } 5337dc359a40SStefano Zampini } else { 5338674ae819SStefano Zampini ierr = MatMultAdd(pcbddc->coarse_phi_B,pcbddc->vec1_P,pcis->vec1_B,pcis->vec1_B);CHKERRQ(ierr); 53398eeda7d8SStefano Zampini if (pcbddc->switch_static) { ierr = MatMultAdd(pcbddc->coarse_phi_D,pcbddc->vec1_P,pcis->vec1_D,pcis->vec1_D);CHKERRQ(ierr); } 5340dc359a40SStefano Zampini } 5341efc2fbd9SStefano Zampini /* store p0 */ 53424f1b2e48SStefano Zampini if (pcbddc->benign_n) { 5343efc2fbd9SStefano Zampini PetscScalar *array; 53444f1b2e48SStefano Zampini PetscInt j; 5345efc2fbd9SStefano Zampini 5346efc2fbd9SStefano Zampini ierr = VecGetArray(pcbddc->vec1_P,&array);CHKERRQ(ierr); 53474f1b2e48SStefano Zampini for (j=0;j<pcbddc->benign_n;j++) pcbddc->benign_p0[j] = array[pcbddc->local_primal_size-pcbddc->benign_n+j]; 5348efc2fbd9SStefano Zampini ierr = VecRestoreArray(pcbddc->vec1_P,&array);CHKERRQ(ierr); 5349efc2fbd9SStefano Zampini } 53504fee134fSStefano Zampini } else { /* expand the coarse solution */ 53514fee134fSStefano Zampini if (applytranspose) { 53524fee134fSStefano Zampini ierr = MatMult(pcbddc->coarse_psi_B,pcbddc->vec1_P,pcis->vec1_B);CHKERRQ(ierr); 53534fee134fSStefano Zampini } else { 53544fee134fSStefano Zampini ierr = MatMult(pcbddc->coarse_phi_B,pcbddc->vec1_P,pcis->vec1_B);CHKERRQ(ierr); 53554fee134fSStefano Zampini } 53564fee134fSStefano Zampini } 5357674ae819SStefano Zampini PetscFunctionReturn(0); 5358674ae819SStefano Zampini } 5359674ae819SStefano Zampini
/*
   PCBDDCScatterCoarseDataBegin - starts the scatter between the local primal
   vector (pcbddc->vec1_P) and the coarse vector (pcbddc->coarse_vec) through
   pcbddc->coarse_loc_to_glob.

   Input Parameters:
+  pc    - the preconditioner; pc->data is read as a PC_BDDC
.  imode - insert mode forwarded unchanged to VecScatterBegin()
-  smode - SCATTER_REVERSE scatters coarse_vec -> vec1_P; any other value
           scatters vec1_P -> coarse_vec

   Notes:
   In the SCATTER_REVERSE case, when this process owns a coarse KSP, the array
   previously placed into the coarse right-hand side is reset and coarse_vec is
   made to alias the storage of the coarse solution before the scatter starts.
   The alias is removed by the SCATTER_REVERSE branch of
   PCBDDCScatterCoarseDataEnd(), so the two calls must be paired.
*/
PetscErrorCode PCBDDCScatterCoarseDataBegin(PC pc,InsertMode imode, ScatterMode smode)
{
  PetscErrorCode    ierr;
  PC_BDDC*          pcbddc = (PC_BDDC*)(pc->data);
  const PetscScalar *array;
  Vec               from,to;

  PetscFunctionBegin;
  if (smode == SCATTER_REVERSE) { /* from global to local -> get data from coarse solution */
    from = pcbddc->coarse_vec;
    to   = pcbddc->vec1_P;
    if (pcbddc->coarse_ksp) { /* get array from coarse processes */
      Vec tvec;

      /* undo the VecPlaceArray() done on the coarse rhs at the end of the forward scatter */
      ierr = KSPGetRhs(pcbddc->coarse_ksp,&tvec);CHKERRQ(ierr);
      ierr = VecResetArray(tvec);CHKERRQ(ierr);
      /* alias the coarse solution storage: the pointer is only handed to VecPlaceArray(),
         never written through, so read-only access is enough and the solution vector
         is not flagged as modified */
      ierr = KSPGetSolution(pcbddc->coarse_ksp,&tvec);CHKERRQ(ierr);
      ierr = VecGetArrayRead(tvec,&array);CHKERRQ(ierr);
      ierr = VecPlaceArray(from,array);CHKERRQ(ierr);
      ierr = VecRestoreArrayRead(tvec,&array);CHKERRQ(ierr);
    }
  } else { /* from local to global -> put data in coarse right hand side */
    from = pcbddc->vec1_P;
    to   = pcbddc->coarse_vec;
  }
  ierr = VecScatterBegin(pcbddc->coarse_loc_to_glob,from,to,imode,smode);CHKERRQ(ierr);
  PetscFunctionReturn(0);
}

/*
   PCBDDCScatterCoarseDataEnd - completes the scatter started by
   PCBDDCScatterCoarseDataBegin() and fixes up the array aliasing between
   pcbddc->coarse_vec and the vectors of the coarse KSP.

   Input Parameters:
+  pc    - the preconditioner; pc->data is read as a PC_BDDC
.  imode - insert mode forwarded unchanged to VecScatterEnd()
-  smode - SCATTER_REVERSE scatters coarse_vec -> vec1_P; any other value
           scatters vec1_P -> coarse_vec

   Notes:
   After the scatter, and only when this process owns a coarse KSP:
   - smode == SCATTER_FORWARD: the coarse right-hand side is made to alias the
     storage of coarse_vec (the alias is reset by the next SCATTER_REVERSE
     call to PCBDDCScatterCoarseDataBegin());
   - otherwise: the array placed into coarse_vec by
     PCBDDCScatterCoarseDataBegin() is reset.
*/
PetscErrorCode PCBDDCScatterCoarseDataEnd(PC pc, InsertMode imode, ScatterMode smode)
{
  PetscErrorCode    ierr;
  PC_BDDC*          pcbddc = (PC_BDDC*)(pc->data);
  const PetscScalar *array;
  Vec               from,to;

  PetscFunctionBegin;
  if (smode == SCATTER_REVERSE) { /* from global to local -> get data from coarse solution */
    from = pcbddc->coarse_vec;
    to   = pcbddc->vec1_P;
  } else { /* from local to global -> put data in coarse right hand side */
    from = pcbddc->vec1_P;
    to   = pcbddc->coarse_vec;
  }
  ierr = VecScatterEnd(pcbddc->coarse_loc_to_glob,from,to,imode,smode);CHKERRQ(ierr);
  if (smode == SCATTER_FORWARD) {
    if (pcbddc->coarse_ksp) { /* get array from coarse processes */
      Vec tvec;

      /* the coarse rhs aliases the freshly scattered data; read-only access suffices
         because the pointer is only passed on to VecPlaceArray() */
      ierr = KSPGetRhs(pcbddc->coarse_ksp,&tvec);CHKERRQ(ierr);
      ierr = VecGetArrayRead(to,&array);CHKERRQ(ierr);
      ierr = VecPlaceArray(tvec,array);CHKERRQ(ierr);
      ierr = VecRestoreArrayRead(to,&array);CHKERRQ(ierr);
    }
  } else {
    if (pcbddc->coarse_ksp) { /* restore array of pcbddc->coarse_vec */
      ierr = VecResetArray(from);CHKERRQ(ierr);
    }
  }
  PetscFunctionReturn(0);
}
5421674ae819SStefano Zampini 5422984c4197SStefano Zampini /* uncomment for testing purposes */ 5423984c4197SStefano Zampini /* #define PETSC_MISSING_LAPACK_GESVD 1 */ 5424674ae819SStefano Zampini PetscErrorCode PCBDDCConstraintsSetUp(PC pc) 5425674ae819SStefano Zampini { 5426674ae819SStefano Zampini PetscErrorCode ierr; 5427674ae819SStefano Zampini PC_IS* pcis = (PC_IS*)(pc->data); 
5428674ae819SStefano Zampini PC_BDDC* pcbddc = (PC_BDDC*)pc->data; 5429674ae819SStefano Zampini Mat_IS* matis = (Mat_IS*)pc->pmat->data; 5430984c4197SStefano Zampini /* one and zero */ 5431984c4197SStefano Zampini PetscScalar one=1.0,zero=0.0; 5432984c4197SStefano Zampini /* space to store constraints and their local indices */ 54339162d606SStefano Zampini PetscScalar *constraints_data; 54349162d606SStefano Zampini PetscInt *constraints_idxs,*constraints_idxs_B; 54359162d606SStefano Zampini PetscInt *constraints_idxs_ptr,*constraints_data_ptr; 54369162d606SStefano Zampini PetscInt *constraints_n; 5437984c4197SStefano Zampini /* iterators */ 5438b3d85658SStefano Zampini PetscInt i,j,k,total_counts,total_counts_cc,cum; 5439984c4197SStefano Zampini /* BLAS integers */ 5440e310c8b4SStefano Zampini PetscBLASInt lwork,lierr; 5441e310c8b4SStefano Zampini PetscBLASInt Blas_N,Blas_M,Blas_K,Blas_one=1; 5442c4303822SStefano Zampini PetscBLASInt Blas_LDA,Blas_LDB,Blas_LDC; 5443727cdba6SStefano Zampini /* reuse */ 54440e6343abSStefano Zampini PetscInt olocal_primal_size,olocal_primal_size_cc; 54450e6343abSStefano Zampini PetscInt *olocal_primal_ref_node,*olocal_primal_ref_mult; 5446984c4197SStefano Zampini /* change of basis */ 5447b3d85658SStefano Zampini PetscBool qr_needed; 54489162d606SStefano Zampini PetscBT change_basis,qr_needed_idx; 5449984c4197SStefano Zampini /* auxiliary stuff */ 545064efe560SStefano Zampini PetscInt *nnz,*is_indices; 54518a0068c3SStefano Zampini PetscInt ncc; 5452984c4197SStefano Zampini /* some quantities */ 545345a1bb75SStefano Zampini PetscInt n_vertices,total_primal_vertices,valid_constraints; 5454a58a30b4SStefano Zampini PetscInt size_of_constraint,max_size_of_constraint=0,max_constraints,temp_constraints; 5455984c4197SStefano Zampini 5456674ae819SStefano Zampini PetscFunctionBegin; 54578e61c736SStefano Zampini /* Destroy Mat objects computed previously */ 54588e61c736SStefano Zampini ierr = 
MatDestroy(&pcbddc->ChangeOfBasisMatrix);CHKERRQ(ierr); 54598e61c736SStefano Zampini ierr = MatDestroy(&pcbddc->ConstraintMatrix);CHKERRQ(ierr); 546016909a7fSStefano Zampini ierr = MatDestroy(&pcbddc->switch_static_change);CHKERRQ(ierr); 5461088faed8SStefano Zampini /* save info on constraints from previous setup (if any) */ 5462088faed8SStefano Zampini olocal_primal_size = pcbddc->local_primal_size; 54630e6343abSStefano Zampini olocal_primal_size_cc = pcbddc->local_primal_size_cc; 54640e6343abSStefano Zampini ierr = PetscMalloc2(olocal_primal_size_cc,&olocal_primal_ref_node,olocal_primal_size_cc,&olocal_primal_ref_mult);CHKERRQ(ierr); 54650e6343abSStefano Zampini ierr = PetscMemcpy(olocal_primal_ref_node,pcbddc->local_primal_ref_node,olocal_primal_size_cc*sizeof(PetscInt));CHKERRQ(ierr); 54660e6343abSStefano Zampini ierr = PetscMemcpy(olocal_primal_ref_mult,pcbddc->local_primal_ref_mult,olocal_primal_size_cc*sizeof(PetscInt));CHKERRQ(ierr); 54670e6343abSStefano Zampini ierr = PetscFree2(pcbddc->local_primal_ref_node,pcbddc->local_primal_ref_mult);CHKERRQ(ierr); 5468088faed8SStefano Zampini ierr = PetscFree(pcbddc->primal_indices_local_idxs);CHKERRQ(ierr); 5469cf5a6209SStefano Zampini 5470cf5a6209SStefano Zampini if (!pcbddc->adaptive_selection) { 54719162d606SStefano Zampini IS ISForVertices,*ISForFaces,*ISForEdges; 5472cf5a6209SStefano Zampini MatNullSpace nearnullsp; 5473cf5a6209SStefano Zampini const Vec *nearnullvecs; 5474cf5a6209SStefano Zampini Vec *localnearnullsp; 5475cf5a6209SStefano Zampini PetscScalar *array; 5476cf5a6209SStefano Zampini PetscInt n_ISForFaces,n_ISForEdges,nnsp_size; 5477cf5a6209SStefano Zampini PetscBool nnsp_has_cnst; 5478674ae819SStefano Zampini /* LAPACK working arrays for SVD or POD */ 5479b3d85658SStefano Zampini PetscBool skip_lapack,boolforchange; 5480674ae819SStefano Zampini PetscScalar *work; 5481674ae819SStefano Zampini PetscReal *singular_vals; 5482674ae819SStefano Zampini #if defined(PETSC_USE_COMPLEX) 5483674ae819SStefano 
Zampini PetscReal *rwork; 5484674ae819SStefano Zampini #endif 5485674ae819SStefano Zampini #if defined(PETSC_MISSING_LAPACK_GESVD) 5486674ae819SStefano Zampini PetscScalar *temp_basis,*correlation_mat; 5487674ae819SStefano Zampini #else 5488964fefecSStefano Zampini PetscBLASInt dummy_int=1; 5489964fefecSStefano Zampini PetscScalar dummy_scalar=1.; 5490674ae819SStefano Zampini #endif 5491674ae819SStefano Zampini 5492674ae819SStefano Zampini /* Get index sets for faces, edges and vertices from graph */ 5493d06fc5fdSStefano Zampini ierr = PCBDDCGraphGetCandidatesIS(pcbddc->mat_graph,&n_ISForFaces,&ISForFaces,&n_ISForEdges,&ISForEdges,&ISForVertices);CHKERRQ(ierr); 5494e4d548c7SStefano Zampini /* print some info */ 54955c643e28SStefano Zampini if (pcbddc->dbg_flag && (!pcbddc->sub_schurs || pcbddc->sub_schurs_rebuild)) { 5496e4d548c7SStefano Zampini PetscInt nv; 5497e4d548c7SStefano Zampini 5498c8272957SStefano Zampini ierr = PCBDDCGraphASCIIView(pcbddc->mat_graph,pcbddc->dbg_flag,pcbddc->dbg_viewer);CHKERRQ(ierr); 5499e4d548c7SStefano Zampini ierr = ISGetSize(ISForVertices,&nv);CHKERRQ(ierr); 5500e4d548c7SStefano Zampini ierr = PetscViewerASCIIPushSynchronized(pcbddc->dbg_viewer);CHKERRQ(ierr); 5501e4d548c7SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"--------------------------------------------------------------\n");CHKERRQ(ierr); 5502e4d548c7SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"Subdomain %04d got %02d local candidate vertices (%d)\n",PetscGlobalRank,nv,pcbddc->use_vertices);CHKERRQ(ierr); 5503e4d548c7SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"Subdomain %04d got %02d local candidate edges (%d)\n",PetscGlobalRank,n_ISForEdges,pcbddc->use_edges);CHKERRQ(ierr); 5504e4d548c7SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"Subdomain %04d got %02d local candidate faces 
(%d)\n",PetscGlobalRank,n_ISForFaces,pcbddc->use_faces);CHKERRQ(ierr); 5505e4d548c7SStefano Zampini ierr = PetscViewerFlush(pcbddc->dbg_viewer);CHKERRQ(ierr); 5506e4d548c7SStefano Zampini ierr = PetscViewerASCIIPopSynchronized(pcbddc->dbg_viewer);CHKERRQ(ierr); 5507e4d548c7SStefano Zampini } 5508e4d548c7SStefano Zampini 5509d06fc5fdSStefano Zampini /* free unneeded index sets */ 5510d06fc5fdSStefano Zampini if (!pcbddc->use_vertices) { 5511d06fc5fdSStefano Zampini ierr = ISDestroy(&ISForVertices);CHKERRQ(ierr); 5512674ae819SStefano Zampini } 5513d06fc5fdSStefano Zampini if (!pcbddc->use_edges) { 5514d06fc5fdSStefano Zampini for (i=0;i<n_ISForEdges;i++) { 5515d06fc5fdSStefano Zampini ierr = ISDestroy(&ISForEdges[i]);CHKERRQ(ierr); 5516d06fc5fdSStefano Zampini } 5517d06fc5fdSStefano Zampini ierr = PetscFree(ISForEdges);CHKERRQ(ierr); 5518d06fc5fdSStefano Zampini n_ISForEdges = 0; 5519d06fc5fdSStefano Zampini } 5520d06fc5fdSStefano Zampini if (!pcbddc->use_faces) { 5521d06fc5fdSStefano Zampini for (i=0;i<n_ISForFaces;i++) { 5522d06fc5fdSStefano Zampini ierr = ISDestroy(&ISForFaces[i]);CHKERRQ(ierr); 5523d06fc5fdSStefano Zampini } 5524d06fc5fdSStefano Zampini ierr = PetscFree(ISForFaces);CHKERRQ(ierr); 5525d06fc5fdSStefano Zampini n_ISForFaces = 0; 5526d06fc5fdSStefano Zampini } 552770022509SStefano Zampini 5528674ae819SStefano Zampini /* check if near null space is attached to global mat */ 5529674ae819SStefano Zampini ierr = MatGetNearNullSpace(pc->pmat,&nearnullsp);CHKERRQ(ierr); 5530674ae819SStefano Zampini if (nearnullsp) { 5531674ae819SStefano Zampini ierr = MatNullSpaceGetVecs(nearnullsp,&nnsp_has_cnst,&nnsp_size,&nearnullvecs);CHKERRQ(ierr); 5532f4ddd8eeSStefano Zampini /* remove any stored info */ 5533f4ddd8eeSStefano Zampini ierr = MatNullSpaceDestroy(&pcbddc->onearnullspace);CHKERRQ(ierr); 5534f4ddd8eeSStefano Zampini ierr = PetscFree(pcbddc->onearnullvecs_state);CHKERRQ(ierr); 5535f4ddd8eeSStefano Zampini /* store information for BDDC solver reuse */ 
5536f4ddd8eeSStefano Zampini ierr = PetscObjectReference((PetscObject)nearnullsp);CHKERRQ(ierr); 5537f4ddd8eeSStefano Zampini pcbddc->onearnullspace = nearnullsp; 5538473ba861SJed Brown ierr = PetscMalloc1(nnsp_size,&pcbddc->onearnullvecs_state);CHKERRQ(ierr); 5539f4ddd8eeSStefano Zampini for (i=0;i<nnsp_size;i++) { 5540f4ddd8eeSStefano Zampini ierr = PetscObjectStateGet((PetscObject)nearnullvecs[i],&pcbddc->onearnullvecs_state[i]);CHKERRQ(ierr); 5541f4ddd8eeSStefano Zampini } 5542984c4197SStefano Zampini } else { /* if near null space is not provided BDDC uses constants by default */ 5543984c4197SStefano Zampini nnsp_size = 0; 5544674ae819SStefano Zampini nnsp_has_cnst = PETSC_TRUE; 5545674ae819SStefano Zampini } 5546984c4197SStefano Zampini /* get max number of constraints on a single cc */ 5547984c4197SStefano Zampini max_constraints = nnsp_size; 5548984c4197SStefano Zampini if (nnsp_has_cnst) max_constraints++; 5549984c4197SStefano Zampini 5550674ae819SStefano Zampini /* 5551674ae819SStefano Zampini Evaluate maximum storage size needed by the procedure 55529162d606SStefano Zampini - Indices for connected component i stored at "constraints_idxs + constraints_idxs_ptr[i]" 55539162d606SStefano Zampini - Values for constraints on connected component i stored at "constraints_data + constraints_data_ptr[i]" 55549162d606SStefano Zampini There can be multiple constraints per connected component 5555674ae819SStefano Zampini */ 5556674ae819SStefano Zampini n_vertices = 0; 5557674ae819SStefano Zampini if (ISForVertices) { 5558674ae819SStefano Zampini ierr = ISGetSize(ISForVertices,&n_vertices);CHKERRQ(ierr); 5559674ae819SStefano Zampini } 55609162d606SStefano Zampini ncc = n_vertices+n_ISForFaces+n_ISForEdges; 55619162d606SStefano Zampini ierr = PetscMalloc3(ncc+1,&constraints_idxs_ptr,ncc+1,&constraints_data_ptr,ncc,&constraints_n);CHKERRQ(ierr); 55629162d606SStefano Zampini 55639162d606SStefano Zampini total_counts = n_ISForFaces+n_ISForEdges; 55649162d606SStefano 
Zampini total_counts *= max_constraints; 5565674ae819SStefano Zampini total_counts += n_vertices; 55664641a718SStefano Zampini ierr = PetscBTCreate(total_counts,&change_basis);CHKERRQ(ierr); 55679162d606SStefano Zampini 5568674ae819SStefano Zampini total_counts = 0; 5569674ae819SStefano Zampini max_size_of_constraint = 0; 5570674ae819SStefano Zampini for (i=0;i<n_ISForEdges+n_ISForFaces;i++) { 55719162d606SStefano Zampini IS used_is; 5572674ae819SStefano Zampini if (i<n_ISForEdges) { 55739162d606SStefano Zampini used_is = ISForEdges[i]; 5574674ae819SStefano Zampini } else { 55759162d606SStefano Zampini used_is = ISForFaces[i-n_ISForEdges]; 5576674ae819SStefano Zampini } 55779162d606SStefano Zampini ierr = ISGetSize(used_is,&j);CHKERRQ(ierr); 5578674ae819SStefano Zampini total_counts += j; 5579674ae819SStefano Zampini max_size_of_constraint = PetscMax(j,max_size_of_constraint); 5580674ae819SStefano Zampini } 55819162d606SStefano Zampini ierr = PetscMalloc3(total_counts*max_constraints+n_vertices,&constraints_data,total_counts+n_vertices,&constraints_idxs,total_counts+n_vertices,&constraints_idxs_B);CHKERRQ(ierr); 55829162d606SStefano Zampini 5583984c4197SStefano Zampini /* get local part of global near null space vectors */ 5584785e854fSJed Brown ierr = PetscMalloc1(nnsp_size,&localnearnullsp);CHKERRQ(ierr); 5585984c4197SStefano Zampini for (k=0;k<nnsp_size;k++) { 5586984c4197SStefano Zampini ierr = VecDuplicate(pcis->vec1_N,&localnearnullsp[k]);CHKERRQ(ierr); 5587e176bc59SStefano Zampini ierr = VecScatterBegin(matis->rctx,nearnullvecs[k],localnearnullsp[k],INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 5588e176bc59SStefano Zampini ierr = VecScatterEnd(matis->rctx,nearnullvecs[k],localnearnullsp[k],INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 5589984c4197SStefano Zampini } 5590674ae819SStefano Zampini 5591242a89d7SStefano Zampini /* whether or not to skip lapack calls */ 5592242a89d7SStefano Zampini skip_lapack = PETSC_TRUE; 5593a773dcb8SStefano Zampini if 
(n_ISForFaces+n_ISForEdges && max_constraints > 1 && !pcbddc->use_nnsp_true) skip_lapack = PETSC_FALSE; 5594242a89d7SStefano Zampini 5595984c4197SStefano Zampini /* First we issue queries to allocate optimal workspace for LAPACKgesvd (or LAPACKsyev if SVD is missing) */ 5596a773dcb8SStefano Zampini if (!skip_lapack) { 5597674ae819SStefano Zampini PetscScalar temp_work; 5598911cabfeSStefano Zampini 5599674ae819SStefano Zampini #if defined(PETSC_MISSING_LAPACK_GESVD) 5600984c4197SStefano Zampini /* Proper Orthogonal Decomposition (POD) using the snapshot method */ 5601785e854fSJed Brown ierr = PetscMalloc1(max_constraints*max_constraints,&correlation_mat);CHKERRQ(ierr); 5602785e854fSJed Brown ierr = PetscMalloc1(max_constraints,&singular_vals);CHKERRQ(ierr); 5603785e854fSJed Brown ierr = PetscMalloc1(max_size_of_constraint*max_constraints,&temp_basis);CHKERRQ(ierr); 5604674ae819SStefano Zampini #if defined(PETSC_USE_COMPLEX) 5605785e854fSJed Brown ierr = PetscMalloc1(3*max_constraints,&rwork);CHKERRQ(ierr); 5606674ae819SStefano Zampini #endif 5607674ae819SStefano Zampini /* now we evaluate the optimal workspace using query with lwork=-1 */ 5608c8244a33SStefano Zampini ierr = PetscBLASIntCast(max_constraints,&Blas_N);CHKERRQ(ierr); 5609c8244a33SStefano Zampini ierr = PetscBLASIntCast(max_constraints,&Blas_LDA);CHKERRQ(ierr); 5610674ae819SStefano Zampini lwork = -1; 5611674ae819SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 5612674ae819SStefano Zampini #if !defined(PETSC_USE_COMPLEX) 5613c8244a33SStefano Zampini PetscStackCallBLAS("LAPACKsyev",LAPACKsyev_("V","U",&Blas_N,correlation_mat,&Blas_LDA,singular_vals,&temp_work,&lwork,&lierr)); 5614674ae819SStefano Zampini #else 5615c8244a33SStefano Zampini PetscStackCallBLAS("LAPACKsyev",LAPACKsyev_("V","U",&Blas_N,correlation_mat,&Blas_LDA,singular_vals,&temp_work,&lwork,rwork,&lierr)); 5616674ae819SStefano Zampini #endif 5617674ae819SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 
5618984c4197SStefano Zampini if (lierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in query to SYEV Lapack routine %d",(int)lierr); 5619674ae819SStefano Zampini #else /* on missing GESVD */ 5620674ae819SStefano Zampini /* SVD */ 5621674ae819SStefano Zampini PetscInt max_n,min_n; 5622674ae819SStefano Zampini max_n = max_size_of_constraint; 5623984c4197SStefano Zampini min_n = max_constraints; 5624984c4197SStefano Zampini if (max_size_of_constraint < max_constraints) { 5625674ae819SStefano Zampini min_n = max_size_of_constraint; 5626984c4197SStefano Zampini max_n = max_constraints; 5627674ae819SStefano Zampini } 5628785e854fSJed Brown ierr = PetscMalloc1(min_n,&singular_vals);CHKERRQ(ierr); 5629674ae819SStefano Zampini #if defined(PETSC_USE_COMPLEX) 5630785e854fSJed Brown ierr = PetscMalloc1(5*min_n,&rwork);CHKERRQ(ierr); 5631674ae819SStefano Zampini #endif 5632674ae819SStefano Zampini /* now we evaluate the optimal workspace using query with lwork=-1 */ 5633674ae819SStefano Zampini lwork = -1; 5634e310c8b4SStefano Zampini ierr = PetscBLASIntCast(max_n,&Blas_M);CHKERRQ(ierr); 5635e310c8b4SStefano Zampini ierr = PetscBLASIntCast(min_n,&Blas_N);CHKERRQ(ierr); 5636b7d8b9f8SStefano Zampini ierr = PetscBLASIntCast(max_n,&Blas_LDA);CHKERRQ(ierr); 5637674ae819SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 5638674ae819SStefano Zampini #if !defined(PETSC_USE_COMPLEX) 56399162d606SStefano Zampini PetscStackCallBLAS("LAPACKgesvd",LAPACKgesvd_("O","N",&Blas_M,&Blas_N,&constraints_data[0],&Blas_LDA,singular_vals,&dummy_scalar,&dummy_int,&dummy_scalar,&dummy_int,&temp_work,&lwork,&lierr)); 5640674ae819SStefano Zampini #else 56419162d606SStefano Zampini PetscStackCallBLAS("LAPACKgesvd",LAPACKgesvd_("O","N",&Blas_M,&Blas_N,&constraints_data[0],&Blas_LDA,singular_vals,&dummy_scalar,&dummy_int,&dummy_scalar,&dummy_int,&temp_work,&lwork,rwork,&lierr)); 5642674ae819SStefano Zampini #endif 5643674ae819SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 
5644984c4197SStefano Zampini if (lierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in query to GESVD Lapack routine %d",(int)lierr); 5645984c4197SStefano Zampini #endif /* on missing GESVD */ 5646674ae819SStefano Zampini /* Allocate optimal workspace */ 5647674ae819SStefano Zampini ierr = PetscBLASIntCast((PetscInt)PetscRealPart(temp_work),&lwork);CHKERRQ(ierr); 5648854ce69bSBarry Smith ierr = PetscMalloc1(lwork,&work);CHKERRQ(ierr); 5649674ae819SStefano Zampini } 5650674ae819SStefano Zampini /* Now we can loop on constraining sets */ 5651674ae819SStefano Zampini total_counts = 0; 56529162d606SStefano Zampini constraints_idxs_ptr[0] = 0; 56539162d606SStefano Zampini constraints_data_ptr[0] = 0; 5654674ae819SStefano Zampini /* vertices */ 56559162d606SStefano Zampini if (n_vertices) { 5656674ae819SStefano Zampini ierr = ISGetIndices(ISForVertices,(const PetscInt**)&is_indices);CHKERRQ(ierr); 56579162d606SStefano Zampini ierr = PetscMemcpy(constraints_idxs,is_indices,n_vertices*sizeof(PetscInt));CHKERRQ(ierr); 5658674ae819SStefano Zampini for (i=0;i<n_vertices;i++) { 56599162d606SStefano Zampini constraints_n[total_counts] = 1; 56609162d606SStefano Zampini constraints_data[total_counts] = 1.0; 56619162d606SStefano Zampini constraints_idxs_ptr[total_counts+1] = constraints_idxs_ptr[total_counts]+1; 56629162d606SStefano Zampini constraints_data_ptr[total_counts+1] = constraints_data_ptr[total_counts]+1; 5663674ae819SStefano Zampini total_counts++; 5664674ae819SStefano Zampini } 5665674ae819SStefano Zampini ierr = ISRestoreIndices(ISForVertices,(const PetscInt**)&is_indices);CHKERRQ(ierr); 5666674ae819SStefano Zampini n_vertices = total_counts; 5667674ae819SStefano Zampini } 5668984c4197SStefano Zampini 5669674ae819SStefano Zampini /* edges and faces */ 56709162d606SStefano Zampini total_counts_cc = total_counts; 5671911cabfeSStefano Zampini for (ncc=0;ncc<n_ISForEdges+n_ISForFaces;ncc++) { 56729162d606SStefano Zampini IS used_is; 56739162d606SStefano Zampini 
PetscBool idxs_copied = PETSC_FALSE; 56749162d606SStefano Zampini 5675911cabfeSStefano Zampini if (ncc<n_ISForEdges) { 56769162d606SStefano Zampini used_is = ISForEdges[ncc]; 5677984c4197SStefano Zampini boolforchange = pcbddc->use_change_of_basis; /* change or not the basis on the edge */ 5678674ae819SStefano Zampini } else { 56799162d606SStefano Zampini used_is = ISForFaces[ncc-n_ISForEdges]; 5680984c4197SStefano Zampini boolforchange = (PetscBool)(pcbddc->use_change_of_basis && pcbddc->use_change_on_faces); /* change or not the basis on the face */ 5681674ae819SStefano Zampini } 5682674ae819SStefano Zampini temp_constraints = 0; /* zero the number of constraints I have on this conn comp */ 56839162d606SStefano Zampini 56849162d606SStefano Zampini ierr = ISGetSize(used_is,&size_of_constraint);CHKERRQ(ierr); 56859162d606SStefano Zampini ierr = ISGetIndices(used_is,(const PetscInt**)&is_indices);CHKERRQ(ierr); 5686984c4197SStefano Zampini /* change of basis should not be performed on local periodic nodes */ 5687984c4197SStefano Zampini if (pcbddc->mat_graph->mirrors && pcbddc->mat_graph->mirrors[is_indices[0]]) boolforchange = PETSC_FALSE; 5688674ae819SStefano Zampini if (nnsp_has_cnst) { 56895b08dc53SStefano Zampini PetscScalar quad_value; 56909162d606SStefano Zampini 56919162d606SStefano Zampini ierr = PetscMemcpy(constraints_idxs + constraints_idxs_ptr[total_counts_cc],is_indices,size_of_constraint*sizeof(PetscInt));CHKERRQ(ierr); 56929162d606SStefano Zampini idxs_copied = PETSC_TRUE; 56939162d606SStefano Zampini 5694a773dcb8SStefano Zampini if (!pcbddc->use_nnsp_true) { 5695674ae819SStefano Zampini quad_value = (PetscScalar)(1.0/PetscSqrtReal((PetscReal)size_of_constraint)); 5696a773dcb8SStefano Zampini } else { 5697a773dcb8SStefano Zampini quad_value = 1.0; 5698a773dcb8SStefano Zampini } 5699674ae819SStefano Zampini for (j=0;j<size_of_constraint;j++) { 57009162d606SStefano Zampini constraints_data[constraints_data_ptr[total_counts_cc]+j] = quad_value; 
5701674ae819SStefano Zampini } 57029162d606SStefano Zampini temp_constraints++; 5703674ae819SStefano Zampini total_counts++; 5704674ae819SStefano Zampini } 5705674ae819SStefano Zampini for (k=0;k<nnsp_size;k++) { 5706984c4197SStefano Zampini PetscReal real_value; 57079162d606SStefano Zampini PetscScalar *ptr_to_data; 57089162d606SStefano Zampini 5709984c4197SStefano Zampini ierr = VecGetArrayRead(localnearnullsp[k],(const PetscScalar**)&array);CHKERRQ(ierr); 57109162d606SStefano Zampini ptr_to_data = &constraints_data[constraints_data_ptr[total_counts_cc]+temp_constraints*size_of_constraint]; 5711674ae819SStefano Zampini for (j=0;j<size_of_constraint;j++) { 57129162d606SStefano Zampini ptr_to_data[j] = array[is_indices[j]]; 5713674ae819SStefano Zampini } 5714984c4197SStefano Zampini ierr = VecRestoreArrayRead(localnearnullsp[k],(const PetscScalar**)&array);CHKERRQ(ierr); 5715984c4197SStefano Zampini /* check if array is null on the connected component */ 5716e310c8b4SStefano Zampini ierr = PetscBLASIntCast(size_of_constraint,&Blas_N);CHKERRQ(ierr); 57179162d606SStefano Zampini PetscStackCallBLAS("BLASasum",real_value = BLASasum_(&Blas_N,ptr_to_data,&Blas_one)); 57185b08dc53SStefano Zampini if (real_value > 0.0) { /* keep indices and values */ 5719674ae819SStefano Zampini temp_constraints++; 5720674ae819SStefano Zampini total_counts++; 57219162d606SStefano Zampini if (!idxs_copied) { 57229162d606SStefano Zampini ierr = PetscMemcpy(constraints_idxs + constraints_idxs_ptr[total_counts_cc],is_indices,size_of_constraint*sizeof(PetscInt));CHKERRQ(ierr); 57239162d606SStefano Zampini idxs_copied = PETSC_TRUE; 5724674ae819SStefano Zampini } 5725674ae819SStefano Zampini } 57269162d606SStefano Zampini } 57279162d606SStefano Zampini ierr = ISRestoreIndices(used_is,(const PetscInt**)&is_indices);CHKERRQ(ierr); 572845a1bb75SStefano Zampini valid_constraints = temp_constraints; 5729eb97c9d2SStefano Zampini if (!pcbddc->use_nnsp_true && temp_constraints) { 5730a773dcb8SStefano 
Zampini if (temp_constraints == 1) { /* just normalize the constraint */ 57319162d606SStefano Zampini PetscScalar norm,*ptr_to_data; 57329162d606SStefano Zampini 57339162d606SStefano Zampini ptr_to_data = &constraints_data[constraints_data_ptr[total_counts_cc]]; 5734a773dcb8SStefano Zampini ierr = PetscBLASIntCast(size_of_constraint,&Blas_N);CHKERRQ(ierr); 57359162d606SStefano Zampini PetscStackCallBLAS("BLASdot",norm = BLASdot_(&Blas_N,ptr_to_data,&Blas_one,ptr_to_data,&Blas_one)); 5736a773dcb8SStefano Zampini norm = 1.0/PetscSqrtReal(PetscRealPart(norm)); 57379162d606SStefano Zampini PetscStackCallBLAS("BLASscal",BLASscal_(&Blas_N,&norm,ptr_to_data,&Blas_one)); 5738a773dcb8SStefano Zampini } else { /* perform SVD */ 5739984c4197SStefano Zampini PetscReal tol = 1.0e-8; /* tolerance for retaining eigenmodes */ 57409162d606SStefano Zampini PetscScalar *ptr_to_data = &constraints_data[constraints_data_ptr[total_counts_cc]]; 5741674ae819SStefano Zampini 5742674ae819SStefano Zampini #if defined(PETSC_MISSING_LAPACK_GESVD) 5743984c4197SStefano Zampini /* SVD: Y = U*S*V^H -> U (eigenvectors of Y*Y^H) = Y*V*(S)^\dag 5744984c4197SStefano Zampini POD: Y^H*Y = V*D*V^H, D = S^H*S -> U = Y*V*D^(-1/2) 5745984c4197SStefano Zampini -> When PETSC_USE_COMPLEX and PETSC_MISSING_LAPACK_GESVD are defined 5746984c4197SStefano Zampini the constraints basis will differ (by a complex factor with absolute value equal to 1) 5747984c4197SStefano Zampini from that computed using LAPACKgesvd 5748984c4197SStefano Zampini -> This is due to a different computation of eigenvectors in LAPACKheev 5749984c4197SStefano Zampini -> The quality of the POD-computed basis will be the same */ 5750984c4197SStefano Zampini ierr = PetscMemzero(correlation_mat,temp_constraints*temp_constraints*sizeof(PetscScalar));CHKERRQ(ierr); 5751674ae819SStefano Zampini /* Store upper triangular part of correlation matrix */ 5752e310c8b4SStefano Zampini ierr = PetscBLASIntCast(size_of_constraint,&Blas_N);CHKERRQ(ierr); 
5753984c4197SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 5754674ae819SStefano Zampini for (j=0;j<temp_constraints;j++) { 5755674ae819SStefano Zampini for (k=0;k<j+1;k++) { 57569162d606SStefano Zampini PetscStackCallBLAS("BLASdot",correlation_mat[j*temp_constraints+k] = BLASdot_(&Blas_N,ptr_to_data+k*size_of_constraint,&Blas_one,ptr_to_data+j*size_of_constraint,&Blas_one)); 5757674ae819SStefano Zampini } 5758674ae819SStefano Zampini } 5759e310c8b4SStefano Zampini /* compute eigenvalues and eigenvectors of correlation matrix */ 5760e310c8b4SStefano Zampini ierr = PetscBLASIntCast(temp_constraints,&Blas_N);CHKERRQ(ierr); 5761e310c8b4SStefano Zampini ierr = PetscBLASIntCast(temp_constraints,&Blas_LDA);CHKERRQ(ierr); 5762674ae819SStefano Zampini #if !defined(PETSC_USE_COMPLEX) 5763c8244a33SStefano Zampini PetscStackCallBLAS("LAPACKsyev",LAPACKsyev_("V","U",&Blas_N,correlation_mat,&Blas_LDA,singular_vals,work,&lwork,&lierr)); 5764674ae819SStefano Zampini #else 5765c8244a33SStefano Zampini PetscStackCallBLAS("LAPACKsyev",LAPACKsyev_("V","U",&Blas_N,correlation_mat,&Blas_LDA,singular_vals,work,&lwork,rwork,&lierr)); 5766674ae819SStefano Zampini #endif 5767674ae819SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 5768984c4197SStefano Zampini if (lierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in SYEV Lapack routine %d",(int)lierr); 5769984c4197SStefano Zampini /* retain eigenvalues greater than tol: note that LAPACKsyev gives eigs in ascending order */ 5770674ae819SStefano Zampini j = 0; 5771984c4197SStefano Zampini while (j < temp_constraints && singular_vals[j] < tol) j++; 5772674ae819SStefano Zampini total_counts = total_counts-j; 577345a1bb75SStefano Zampini valid_constraints = temp_constraints-j; 5774e310c8b4SStefano Zampini /* scale and copy POD basis into used quadrature memory */ 5775c4303822SStefano Zampini ierr = PetscBLASIntCast(size_of_constraint,&Blas_M);CHKERRQ(ierr); 5776c4303822SStefano Zampini ierr = 
PetscBLASIntCast(temp_constraints,&Blas_N);CHKERRQ(ierr); 5777c4303822SStefano Zampini ierr = PetscBLASIntCast(temp_constraints,&Blas_K);CHKERRQ(ierr); 5778c4303822SStefano Zampini ierr = PetscBLASIntCast(size_of_constraint,&Blas_LDA);CHKERRQ(ierr); 5779c4303822SStefano Zampini ierr = PetscBLASIntCast(temp_constraints,&Blas_LDB);CHKERRQ(ierr); 5780c4303822SStefano Zampini ierr = PetscBLASIntCast(size_of_constraint,&Blas_LDC);CHKERRQ(ierr); 5781674ae819SStefano Zampini if (j<temp_constraints) { 5782984c4197SStefano Zampini PetscInt ii; 5783984c4197SStefano Zampini for (k=j;k<temp_constraints;k++) singular_vals[k] = 1.0/PetscSqrtReal(singular_vals[k]); 5784674ae819SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 57859162d606SStefano Zampini PetscStackCallBLAS("BLASgemm",BLASgemm_("N","N",&Blas_M,&Blas_N,&Blas_K,&one,ptr_to_data,&Blas_LDA,correlation_mat,&Blas_LDB,&zero,temp_basis,&Blas_LDC)); 5786674ae819SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 5787984c4197SStefano Zampini for (k=0;k<temp_constraints-j;k++) { 5788674ae819SStefano Zampini for (ii=0;ii<size_of_constraint;ii++) { 57899162d606SStefano Zampini ptr_to_data[k*size_of_constraint+ii] = singular_vals[temp_constraints-1-k]*temp_basis[(temp_constraints-1-k)*size_of_constraint+ii]; 5790674ae819SStefano Zampini } 5791674ae819SStefano Zampini } 5792674ae819SStefano Zampini } 5793674ae819SStefano Zampini #else /* on missing GESVD */ 5794e310c8b4SStefano Zampini ierr = PetscBLASIntCast(size_of_constraint,&Blas_M);CHKERRQ(ierr); 5795e310c8b4SStefano Zampini ierr = PetscBLASIntCast(temp_constraints,&Blas_N);CHKERRQ(ierr); 5796b7d8b9f8SStefano Zampini ierr = PetscBLASIntCast(size_of_constraint,&Blas_LDA);CHKERRQ(ierr); 5797674ae819SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 5798674ae819SStefano Zampini #if !defined(PETSC_USE_COMPLEX) 57999162d606SStefano Zampini 
PetscStackCallBLAS("LAPACKgesvd",LAPACKgesvd_("O","N",&Blas_M,&Blas_N,ptr_to_data,&Blas_LDA,singular_vals,&dummy_scalar,&dummy_int,&dummy_scalar,&dummy_int,work,&lwork,&lierr)); 5800674ae819SStefano Zampini #else 58019162d606SStefano Zampini PetscStackCallBLAS("LAPACKgesvd",LAPACKgesvd_("O","N",&Blas_M,&Blas_N,ptr_to_data,&Blas_LDA,singular_vals,&dummy_scalar,&dummy_int,&dummy_scalar,&dummy_int,work,&lwork,rwork,&lierr)); 5802674ae819SStefano Zampini #endif 5803984c4197SStefano Zampini if (lierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in GESVD Lapack routine %d",(int)lierr); 5804674ae819SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 5805984c4197SStefano Zampini /* retain eigenvalues greater than tol: note that LAPACKgesvd gives eigs in descending order */ 5806e310c8b4SStefano Zampini k = temp_constraints; 5807e310c8b4SStefano Zampini if (k > size_of_constraint) k = size_of_constraint; 5808674ae819SStefano Zampini j = 0; 5809e310c8b4SStefano Zampini while (j < k && singular_vals[k-j-1] < tol) j++; 581045a1bb75SStefano Zampini valid_constraints = k-j; 5811911cabfeSStefano Zampini total_counts = total_counts-temp_constraints+valid_constraints; 5812984c4197SStefano Zampini #endif /* on missing GESVD */ 5813674ae819SStefano Zampini } 5814a773dcb8SStefano Zampini } 58159162d606SStefano Zampini /* update pointers information */ 58169162d606SStefano Zampini if (valid_constraints) { 58179162d606SStefano Zampini constraints_n[total_counts_cc] = valid_constraints; 58189162d606SStefano Zampini constraints_idxs_ptr[total_counts_cc+1] = constraints_idxs_ptr[total_counts_cc]+size_of_constraint; 58199162d606SStefano Zampini constraints_data_ptr[total_counts_cc+1] = constraints_data_ptr[total_counts_cc]+size_of_constraint*valid_constraints; 58209162d606SStefano Zampini /* set change_of_basis flag */ 582145a1bb75SStefano Zampini if (boolforchange) { 5822b3d85658SStefano Zampini PetscBTSet(change_basis,total_counts_cc); 58239162d606SStefano Zampini } 
5824b3d85658SStefano Zampini total_counts_cc++; 582545a1bb75SStefano Zampini } 582645a1bb75SStefano Zampini } 5827984c4197SStefano Zampini /* free workspace */ 58288f1c130eSStefano Zampini if (!skip_lapack) { 5829984c4197SStefano Zampini ierr = PetscFree(work);CHKERRQ(ierr); 5830984c4197SStefano Zampini #if defined(PETSC_USE_COMPLEX) 5831984c4197SStefano Zampini ierr = PetscFree(rwork);CHKERRQ(ierr); 5832984c4197SStefano Zampini #endif 5833984c4197SStefano Zampini ierr = PetscFree(singular_vals);CHKERRQ(ierr); 5834984c4197SStefano Zampini #if defined(PETSC_MISSING_LAPACK_GESVD) 5835984c4197SStefano Zampini ierr = PetscFree(correlation_mat);CHKERRQ(ierr); 5836984c4197SStefano Zampini ierr = PetscFree(temp_basis);CHKERRQ(ierr); 5837984c4197SStefano Zampini #endif 5838984c4197SStefano Zampini } 5839984c4197SStefano Zampini for (k=0;k<nnsp_size;k++) { 5840984c4197SStefano Zampini ierr = VecDestroy(&localnearnullsp[k]);CHKERRQ(ierr); 5841984c4197SStefano Zampini } 5842984c4197SStefano Zampini ierr = PetscFree(localnearnullsp);CHKERRQ(ierr); 5843cf5a6209SStefano Zampini /* free index sets of faces, edges and vertices */ 5844cf5a6209SStefano Zampini for (i=0;i<n_ISForFaces;i++) { 5845cf5a6209SStefano Zampini ierr = ISDestroy(&ISForFaces[i]);CHKERRQ(ierr); 5846cf5a6209SStefano Zampini } 5847cf5a6209SStefano Zampini if (n_ISForFaces) { 5848cf5a6209SStefano Zampini ierr = PetscFree(ISForFaces);CHKERRQ(ierr); 5849cf5a6209SStefano Zampini } 5850cf5a6209SStefano Zampini for (i=0;i<n_ISForEdges;i++) { 5851cf5a6209SStefano Zampini ierr = ISDestroy(&ISForEdges[i]);CHKERRQ(ierr); 5852cf5a6209SStefano Zampini } 5853cf5a6209SStefano Zampini if (n_ISForEdges) { 5854cf5a6209SStefano Zampini ierr = PetscFree(ISForEdges);CHKERRQ(ierr); 5855cf5a6209SStefano Zampini } 5856cf5a6209SStefano Zampini ierr = ISDestroy(&ISForVertices);CHKERRQ(ierr); 585708122e43SStefano Zampini } else { 585808122e43SStefano Zampini PCBDDCSubSchurs sub_schurs = pcbddc->sub_schurs; 5859984c4197SStefano Zampini 
586008122e43SStefano Zampini total_counts = 0; 586108122e43SStefano Zampini n_vertices = 0; 5862d62866d3SStefano Zampini if (sub_schurs->is_vertices && pcbddc->use_vertices) { 5863d62866d3SStefano Zampini ierr = ISGetLocalSize(sub_schurs->is_vertices,&n_vertices);CHKERRQ(ierr); 586408122e43SStefano Zampini } 586508122e43SStefano Zampini max_constraints = 0; 58669162d606SStefano Zampini total_counts_cc = 0; 586708122e43SStefano Zampini for (i=0;i<sub_schurs->n_subs+n_vertices;i++) { 586808122e43SStefano Zampini total_counts += pcbddc->adaptive_constraints_n[i]; 58699162d606SStefano Zampini if (pcbddc->adaptive_constraints_n[i]) total_counts_cc++; 587008122e43SStefano Zampini max_constraints = PetscMax(max_constraints,pcbddc->adaptive_constraints_n[i]); 587108122e43SStefano Zampini } 58729162d606SStefano Zampini constraints_idxs_ptr = pcbddc->adaptive_constraints_idxs_ptr; 58739162d606SStefano Zampini constraints_data_ptr = pcbddc->adaptive_constraints_data_ptr; 58749162d606SStefano Zampini constraints_idxs = pcbddc->adaptive_constraints_idxs; 58759162d606SStefano Zampini constraints_data = pcbddc->adaptive_constraints_data; 587674d5cdf7SStefano Zampini /* constraints_n differs from pcbddc->adaptive_constraints_n */ 58779162d606SStefano Zampini ierr = PetscMalloc1(total_counts_cc,&constraints_n);CHKERRQ(ierr); 58789162d606SStefano Zampini total_counts_cc = 0; 58799162d606SStefano Zampini for (i=0;i<sub_schurs->n_subs+n_vertices;i++) { 58809162d606SStefano Zampini if (pcbddc->adaptive_constraints_n[i]) { 58819162d606SStefano Zampini constraints_n[total_counts_cc++] = pcbddc->adaptive_constraints_n[i]; 588208122e43SStefano Zampini } 588308122e43SStefano Zampini } 58849162d606SStefano Zampini #if 0 58859162d606SStefano Zampini printf("Found %d totals (%d)\n",total_counts_cc,total_counts); 58869162d606SStefano Zampini for (i=0;i<total_counts_cc;i++) { 58879162d606SStefano Zampini printf("const %d, start %d",i,constraints_idxs_ptr[i]); 58889162d606SStefano Zampini 
printf(" end %d:\n",constraints_idxs_ptr[i+1]); 58899162d606SStefano Zampini for (j=constraints_idxs_ptr[i];j<constraints_idxs_ptr[i+1];j++) { 58909162d606SStefano Zampini printf(" %d",constraints_idxs[j]); 58919162d606SStefano Zampini } 58929162d606SStefano Zampini printf("\n"); 58939162d606SStefano Zampini printf("number of cc: %d\n",constraints_n[i]); 58949162d606SStefano Zampini } 58951b968477SStefano Zampini for (i=0;i<n_vertices;i++) { 58968bec7fa6SStefano Zampini PetscPrintf(PETSC_COMM_SELF,"[%d] vertex %d, n %d\n",PetscGlobalRank,i,pcbddc->adaptive_constraints_n[i]); 58971b968477SStefano Zampini } 58981b968477SStefano Zampini for (i=0;i<sub_schurs->n_subs;i++) { 58998bec7fa6SStefano Zampini PetscPrintf(PETSC_COMM_SELF,"[%d] sub %d, edge %d, n %d\n",PetscGlobalRank,i,(PetscBool)PetscBTLookup(sub_schurs->is_edge,i),pcbddc->adaptive_constraints_n[i+n_vertices]); 59001b968477SStefano Zampini } 590108122e43SStefano Zampini #endif 590208122e43SStefano Zampini 59038bec7fa6SStefano Zampini max_size_of_constraint = 0; 59049162d606SStefano Zampini for (i=0;i<total_counts_cc;i++) max_size_of_constraint = PetscMax(max_size_of_constraint,constraints_idxs_ptr[i+1]-constraints_idxs_ptr[i]); 59059162d606SStefano Zampini ierr = PetscMalloc1(constraints_idxs_ptr[total_counts_cc],&constraints_idxs_B);CHKERRQ(ierr); 590608122e43SStefano Zampini /* Change of basis */ 5907b3d85658SStefano Zampini ierr = PetscBTCreate(total_counts_cc,&change_basis);CHKERRQ(ierr); 590808122e43SStefano Zampini if (pcbddc->use_change_of_basis) { 590908122e43SStefano Zampini for (i=0;i<sub_schurs->n_subs;i++) { 591008122e43SStefano Zampini if (PetscBTLookup(sub_schurs->is_edge,i) || pcbddc->use_change_on_faces) { 5911b3d85658SStefano Zampini ierr = PetscBTSet(change_basis,i+n_vertices);CHKERRQ(ierr); 591208122e43SStefano Zampini } 591308122e43SStefano Zampini } 591408122e43SStefano Zampini } 591508122e43SStefano Zampini } 5916984c4197SStefano Zampini pcbddc->local_primal_size = total_counts; 
59174f1b2e48SStefano Zampini ierr = PetscMalloc1(pcbddc->local_primal_size+pcbddc->benign_n,&pcbddc->primal_indices_local_idxs);CHKERRQ(ierr); 591808122e43SStefano Zampini 59199162d606SStefano Zampini /* map constraints_idxs in boundary numbering */ 59209162d606SStefano Zampini ierr = ISGlobalToLocalMappingApply(pcis->BtoNmap,IS_GTOLM_DROP,constraints_idxs_ptr[total_counts_cc],constraints_idxs,&i,constraints_idxs_B);CHKERRQ(ierr); 5921eee23b56SStefano Zampini if (i != constraints_idxs_ptr[total_counts_cc]) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Error in boundary numbering for constraints indices %D != %D\n",constraints_idxs_ptr[total_counts_cc],i); 5922674ae819SStefano Zampini 5923674ae819SStefano Zampini /* Create constraint matrix */ 5924674ae819SStefano Zampini ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->ConstraintMatrix);CHKERRQ(ierr); 592516f15bc4SStefano Zampini ierr = MatSetType(pcbddc->ConstraintMatrix,MATAIJ);CHKERRQ(ierr); 5926984c4197SStefano Zampini ierr = MatSetSizes(pcbddc->ConstraintMatrix,pcbddc->local_primal_size,pcis->n,pcbddc->local_primal_size,pcis->n);CHKERRQ(ierr); 5927984c4197SStefano Zampini 5928984c4197SStefano Zampini /* find primal_dofs: subdomain corners plus dofs selected as primal after change of basis */ 5929a717540cSStefano Zampini /* determine if a QR strategy is needed for change of basis */ 5930a717540cSStefano Zampini qr_needed = PETSC_FALSE; 593174d5cdf7SStefano Zampini ierr = PetscBTCreate(total_counts_cc,&qr_needed_idx);CHKERRQ(ierr); 5932984c4197SStefano Zampini total_primal_vertices=0; 5933b3d85658SStefano Zampini pcbddc->local_primal_size_cc = 0; 59349162d606SStefano Zampini for (i=0;i<total_counts_cc;i++) { 59359162d606SStefano Zampini size_of_constraint = constraints_idxs_ptr[i+1]-constraints_idxs_ptr[i]; 593672b8c272SStefano Zampini if (size_of_constraint == 1 && pcbddc->mat_graph->custom_minimal_size) { 59379162d606SStefano Zampini pcbddc->primal_indices_local_idxs[total_primal_vertices++] = 
constraints_idxs[constraints_idxs_ptr[i]]; 5938b3d85658SStefano Zampini pcbddc->local_primal_size_cc += 1; 593964efe560SStefano Zampini } else if (PetscBTLookup(change_basis,i)) { 59409162d606SStefano Zampini for (k=0;k<constraints_n[i];k++) { 59419162d606SStefano Zampini pcbddc->primal_indices_local_idxs[total_primal_vertices++] = constraints_idxs[constraints_idxs_ptr[i]+k]; 5942a717540cSStefano Zampini } 5943b3d85658SStefano Zampini pcbddc->local_primal_size_cc += constraints_n[i]; 594491af6908SStefano Zampini if (constraints_n[i] > 1 || pcbddc->use_qr_single) { 5945a717540cSStefano Zampini PetscBTSet(qr_needed_idx,i); 5946a717540cSStefano Zampini qr_needed = PETSC_TRUE; 5947a717540cSStefano Zampini } 5948fa434743SStefano Zampini } else { 5949b3d85658SStefano Zampini pcbddc->local_primal_size_cc += 1; 5950fa434743SStefano Zampini } 5951a717540cSStefano Zampini } 5952b371cd4fSStefano Zampini /* note that the local variable n_vertices used below stores the number of pointwise constraints */ 5953b371cd4fSStefano Zampini pcbddc->n_vertices = total_primal_vertices; 5954674ae819SStefano Zampini /* permute indices in order to have a sorted set of vertices */ 595570022509SStefano Zampini ierr = PetscSortInt(total_primal_vertices,pcbddc->primal_indices_local_idxs);CHKERRQ(ierr); 59564f1b2e48SStefano Zampini ierr = PetscMalloc2(pcbddc->local_primal_size_cc+pcbddc->benign_n,&pcbddc->local_primal_ref_node,pcbddc->local_primal_size_cc+pcbddc->benign_n,&pcbddc->local_primal_ref_mult);CHKERRQ(ierr); 59570e6343abSStefano Zampini ierr = PetscMemcpy(pcbddc->local_primal_ref_node,pcbddc->primal_indices_local_idxs,total_primal_vertices*sizeof(PetscInt));CHKERRQ(ierr); 59580e6343abSStefano Zampini for (i=0;i<total_primal_vertices;i++) pcbddc->local_primal_ref_mult[i] = 1; 5959984c4197SStefano Zampini 5960984c4197SStefano Zampini /* nonzero structure of constraint matrix */ 596174d5cdf7SStefano Zampini /* and get reference dof for local constraints */ 5962785e854fSJed Brown ierr = 
PetscMalloc1(pcbddc->local_primal_size,&nnz);CHKERRQ(ierr); 5963984c4197SStefano Zampini for (i=0;i<total_primal_vertices;i++) nnz[i] = 1; 596474d5cdf7SStefano Zampini 5965984c4197SStefano Zampini j = total_primal_vertices; 596674d5cdf7SStefano Zampini total_counts = total_primal_vertices; 5967b3d85658SStefano Zampini cum = total_primal_vertices; 59689162d606SStefano Zampini for (i=n_vertices;i<total_counts_cc;i++) { 59694641a718SStefano Zampini if (!PetscBTLookup(change_basis,i)) { 5970b3d85658SStefano Zampini pcbddc->local_primal_ref_node[cum] = constraints_idxs[constraints_idxs_ptr[i]]; 5971b3d85658SStefano Zampini pcbddc->local_primal_ref_mult[cum] = constraints_n[i]; 5972b3d85658SStefano Zampini cum++; 59739162d606SStefano Zampini size_of_constraint = constraints_idxs_ptr[i+1]-constraints_idxs_ptr[i]; 597474d5cdf7SStefano Zampini for (k=0;k<constraints_n[i];k++) { 597574d5cdf7SStefano Zampini pcbddc->primal_indices_local_idxs[total_counts++] = constraints_idxs[constraints_idxs_ptr[i]+k]; 597674d5cdf7SStefano Zampini nnz[j+k] = size_of_constraint; 597774d5cdf7SStefano Zampini } 59789162d606SStefano Zampini j += constraints_n[i]; 5979674ae819SStefano Zampini } 5980674ae819SStefano Zampini } 5981674ae819SStefano Zampini ierr = MatSeqAIJSetPreallocation(pcbddc->ConstraintMatrix,0,nnz);CHKERRQ(ierr); 5982674ae819SStefano Zampini ierr = PetscFree(nnz);CHKERRQ(ierr); 5983088faed8SStefano Zampini 5984674ae819SStefano Zampini /* set values in constraint matrix */ 5985984c4197SStefano Zampini for (i=0;i<total_primal_vertices;i++) { 59860e6343abSStefano Zampini ierr = MatSetValue(pcbddc->ConstraintMatrix,i,pcbddc->local_primal_ref_node[i],1.0,INSERT_VALUES);CHKERRQ(ierr); 5987674ae819SStefano Zampini } 5988984c4197SStefano Zampini total_counts = total_primal_vertices; 59899162d606SStefano Zampini for (i=n_vertices;i<total_counts_cc;i++) { 59904641a718SStefano Zampini if (!PetscBTLookup(change_basis,i)) { 59919162d606SStefano Zampini PetscInt *cols; 59929162d606SStefano 
Zampini 59939162d606SStefano Zampini size_of_constraint = constraints_idxs_ptr[i+1]-constraints_idxs_ptr[i]; 59949162d606SStefano Zampini cols = constraints_idxs+constraints_idxs_ptr[i]; 59959162d606SStefano Zampini for (k=0;k<constraints_n[i];k++) { 59969162d606SStefano Zampini PetscInt row = total_counts+k; 59979162d606SStefano Zampini PetscScalar *vals; 59989162d606SStefano Zampini 59999162d606SStefano Zampini vals = constraints_data+constraints_data_ptr[i]+k*size_of_constraint; 60009162d606SStefano Zampini ierr = MatSetValues(pcbddc->ConstraintMatrix,1,&row,size_of_constraint,cols,vals,INSERT_VALUES);CHKERRQ(ierr); 60019162d606SStefano Zampini } 60029162d606SStefano Zampini total_counts += constraints_n[i]; 6003674ae819SStefano Zampini } 6004674ae819SStefano Zampini } 6005674ae819SStefano Zampini /* assembling */ 6006674ae819SStefano Zampini ierr = MatAssemblyBegin(pcbddc->ConstraintMatrix,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 6007674ae819SStefano Zampini ierr = MatAssemblyEnd(pcbddc->ConstraintMatrix,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 6008088faed8SStefano Zampini 6009984c4197SStefano Zampini /* 60106a9046bcSBarry Smith ierr = PetscViewerPushFormat(PETSC_VIEWER_STDOUT_SELF,PETSC_VIEWER_ASCII_MATLAB);CHKERRQ(ierr); 6011984c4197SStefano Zampini ierr = MatView(pcbddc->ConstraintMatrix,(PetscViewer)0);CHKERRQ(ierr); 6012f159cad9SBarry Smith ierr = PetscViewerPopFormat(PETSC_VIEWER_STDOUT_SELF);CHKERRQ(ierr); 6013984c4197SStefano Zampini */ 6014674ae819SStefano Zampini /* Create matrix for change of basis. 
We don't need it in case pcbddc->use_change_of_basis is FALSE */ 6015674ae819SStefano Zampini if (pcbddc->use_change_of_basis) { 6016026de310SStefano Zampini /* dual and primal dofs on a single cc */ 6017984c4197SStefano Zampini PetscInt dual_dofs,primal_dofs; 6018984c4197SStefano Zampini /* working stuff for GEQRF */ 601981d9aea3SBarry Smith PetscScalar *qr_basis,*qr_tau = NULL,*qr_work,lqr_work_t; 6020984c4197SStefano Zampini PetscBLASInt lqr_work; 6021984c4197SStefano Zampini /* working stuff for UNGQR */ 6022984c4197SStefano Zampini PetscScalar *gqr_work,lgqr_work_t; 6023984c4197SStefano Zampini PetscBLASInt lgqr_work; 6024984c4197SStefano Zampini /* working stuff for TRTRS */ 6025984c4197SStefano Zampini PetscScalar *trs_rhs; 60263f08241aSStefano Zampini PetscBLASInt Blas_NRHS; 6027984c4197SStefano Zampini /* pointers for values insertion into change of basis matrix */ 6028984c4197SStefano Zampini PetscInt *start_rows,*start_cols; 6029984c4197SStefano Zampini PetscScalar *start_vals; 6030984c4197SStefano Zampini /* working stuff for values insertion */ 60314641a718SStefano Zampini PetscBT is_primal; 603264efe560SStefano Zampini PetscInt *aux_primal_numbering_B; 6033906d46d4SStefano Zampini /* matrix sizes */ 6034906d46d4SStefano Zampini PetscInt global_size,local_size; 6035906d46d4SStefano Zampini /* temporary change of basis */ 6036906d46d4SStefano Zampini Mat localChangeOfBasisMatrix; 6037cf5a6209SStefano Zampini /* extra space for debugging */ 6038cf5a6209SStefano Zampini PetscScalar *dbg_work; 6039984c4197SStefano Zampini 6040906d46d4SStefano Zampini /* local temporary change of basis acts on local interfaces -> dimension is n_B x n_B */ 6041906d46d4SStefano Zampini ierr = MatCreate(PETSC_COMM_SELF,&localChangeOfBasisMatrix);CHKERRQ(ierr); 604216f15bc4SStefano Zampini ierr = MatSetType(localChangeOfBasisMatrix,MATAIJ);CHKERRQ(ierr); 6043bbb9e6c6SStefano Zampini ierr = MatSetSizes(localChangeOfBasisMatrix,pcis->n,pcis->n,pcis->n,pcis->n);CHKERRQ(ierr); 
6044906d46d4SStefano Zampini /* nonzeros for local mat */ 6045bbb9e6c6SStefano Zampini ierr = PetscMalloc1(pcis->n,&nnz);CHKERRQ(ierr); 60461dd7afcfSStefano Zampini if (!pcbddc->benign_change || pcbddc->fake_change) { 6047bbb9e6c6SStefano Zampini for (i=0;i<pcis->n;i++) nnz[i]=1; 60481dd7afcfSStefano Zampini } else { 60491dd7afcfSStefano Zampini const PetscInt *ii; 60501dd7afcfSStefano Zampini PetscInt n; 60511dd7afcfSStefano Zampini PetscBool flg_row; 60521dd7afcfSStefano Zampini ierr = MatGetRowIJ(pcbddc->benign_change,0,PETSC_FALSE,PETSC_FALSE,&n,&ii,NULL,&flg_row);CHKERRQ(ierr); 60531dd7afcfSStefano Zampini for (i=0;i<n;i++) nnz[i] = ii[i+1]-ii[i]; 60541dd7afcfSStefano Zampini ierr = MatRestoreRowIJ(pcbddc->benign_change,0,PETSC_FALSE,PETSC_FALSE,&n,&ii,NULL,&flg_row);CHKERRQ(ierr); 60551dd7afcfSStefano Zampini } 60569162d606SStefano Zampini for (i=n_vertices;i<total_counts_cc;i++) { 6057a717540cSStefano Zampini if (PetscBTLookup(change_basis,i)) { 60589162d606SStefano Zampini size_of_constraint = constraints_idxs_ptr[i+1]-constraints_idxs_ptr[i]; 6059a717540cSStefano Zampini if (PetscBTLookup(qr_needed_idx,i)) { 60609162d606SStefano Zampini for (j=0;j<size_of_constraint;j++) nnz[constraints_idxs[constraints_idxs_ptr[i]+j]] = size_of_constraint; 6061a717540cSStefano Zampini } else { 60629162d606SStefano Zampini nnz[constraints_idxs[constraints_idxs_ptr[i]]] = size_of_constraint; 60639162d606SStefano Zampini for (j=1;j<size_of_constraint;j++) nnz[constraints_idxs[constraints_idxs_ptr[i]+j]] = 2; 6064a717540cSStefano Zampini } 6065a717540cSStefano Zampini } 6066a717540cSStefano Zampini } 6067906d46d4SStefano Zampini ierr = MatSeqAIJSetPreallocation(localChangeOfBasisMatrix,0,nnz);CHKERRQ(ierr); 6068bbb9e6c6SStefano Zampini ierr = PetscFree(nnz);CHKERRQ(ierr); 60691dd7afcfSStefano Zampini /* Set interior change in the matrix */ 60701dd7afcfSStefano Zampini if (!pcbddc->benign_change || pcbddc->fake_change) { 6071bbb9e6c6SStefano Zampini for (i=0;i<pcis->n;i++) { 
6072906d46d4SStefano Zampini ierr = MatSetValue(localChangeOfBasisMatrix,i,i,1.0,INSERT_VALUES);CHKERRQ(ierr); 6073a717540cSStefano Zampini } 60741dd7afcfSStefano Zampini } else { 60751dd7afcfSStefano Zampini const PetscInt *ii,*jj; 60761dd7afcfSStefano Zampini PetscScalar *aa; 60771dd7afcfSStefano Zampini PetscInt n; 60781dd7afcfSStefano Zampini PetscBool flg_row; 60791dd7afcfSStefano Zampini ierr = MatGetRowIJ(pcbddc->benign_change,0,PETSC_FALSE,PETSC_FALSE,&n,&ii,&jj,&flg_row);CHKERRQ(ierr); 60801dd7afcfSStefano Zampini ierr = MatSeqAIJGetArray(pcbddc->benign_change,&aa);CHKERRQ(ierr); 60811dd7afcfSStefano Zampini for (i=0;i<n;i++) { 60821dd7afcfSStefano Zampini ierr = MatSetValues(localChangeOfBasisMatrix,1,&i,ii[i+1]-ii[i],jj+ii[i],aa+ii[i],INSERT_VALUES);CHKERRQ(ierr); 60831dd7afcfSStefano Zampini } 60841dd7afcfSStefano Zampini ierr = MatSeqAIJRestoreArray(pcbddc->benign_change,&aa);CHKERRQ(ierr); 60851dd7afcfSStefano Zampini ierr = MatRestoreRowIJ(pcbddc->benign_change,0,PETSC_FALSE,PETSC_FALSE,&n,&ii,&jj,&flg_row);CHKERRQ(ierr); 60861dd7afcfSStefano Zampini } 6087a717540cSStefano Zampini 6088a717540cSStefano Zampini if (pcbddc->dbg_flag) { 6089a717540cSStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"--------------------------------------------------------------\n");CHKERRQ(ierr); 6090a717540cSStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"Checking change of basis computation for subdomain %04d\n",PetscGlobalRank);CHKERRQ(ierr); 6091a717540cSStefano Zampini } 6092a717540cSStefano Zampini 6093a717540cSStefano Zampini 6094a717540cSStefano Zampini /* Now we loop on the constraints which need a change of basis */ 6095a717540cSStefano Zampini /* 6096a717540cSStefano Zampini Change of basis matrix is evaluated similarly to the FIRST APPROACH in 6097a717540cSStefano Zampini Klawonn and Widlund, Dual-primal FETI-DP methods for linear elasticity, (see Sect 6.2.1) 6098a717540cSStefano Zampini 
6099a6b551f4SStefano Zampini Basic blocks of change of basis matrix T computed by 6100a717540cSStefano Zampini 6101a6b551f4SStefano Zampini - Using the following block transformation if there is only a primal dof on the cc (and -pc_bddc_use_qr_single is not specified) 6102a6b551f4SStefano Zampini 6103a6b551f4SStefano Zampini | 1 0 ... 0 s_1/S | 6104a6b551f4SStefano Zampini | 0 1 ... 0 s_2/S | 6105a717540cSStefano Zampini | ... | 6106a6b551f4SStefano Zampini | 0 ... 1 s_{n-1}/S | 6107a6b551f4SStefano Zampini | -s_1/s_n ... -s_{n-1}/s_n s_n/S | 6108a717540cSStefano Zampini 6109a6b551f4SStefano Zampini with S = \sum_{i=1}^n s_i^2 6110a6b551f4SStefano Zampini NOTE: in the above example, the primal dof is the last one of the edge in LOCAL ordering 6111a6b551f4SStefano Zampini in the current implementation, the primal dof is the first one of the edge in GLOBAL ordering 6112a6b551f4SStefano Zampini 6113a6b551f4SStefano Zampini - QR decomposition of constraints otherwise 6114a717540cSStefano Zampini */ 6115a717540cSStefano Zampini if (qr_needed) { 6116984c4197SStefano Zampini /* space to store Q */ 6117854ce69bSBarry Smith ierr = PetscMalloc1(max_size_of_constraint*max_size_of_constraint,&qr_basis);CHKERRQ(ierr); 61184e64d54eSstefano_zampini /* array to store scaling factors for reflectors */ 61194e64d54eSstefano_zampini ierr = PetscMalloc1(max_constraints,&qr_tau);CHKERRQ(ierr); 6120984c4197SStefano Zampini /* first we issue queries for optimal work */ 61213f08241aSStefano Zampini ierr = PetscBLASIntCast(max_size_of_constraint,&Blas_M);CHKERRQ(ierr); 61223f08241aSStefano Zampini ierr = PetscBLASIntCast(max_constraints,&Blas_N);CHKERRQ(ierr); 61233f08241aSStefano Zampini ierr = PetscBLASIntCast(max_size_of_constraint,&Blas_LDA);CHKERRQ(ierr); 6124984c4197SStefano Zampini lqr_work = -1; 61253f08241aSStefano Zampini PetscStackCallBLAS("LAPACKgeqrf",LAPACKgeqrf_(&Blas_M,&Blas_N,qr_basis,&Blas_LDA,qr_tau,&lqr_work_t,&lqr_work,&lierr)); 6126984c4197SStefano Zampini if (lierr) 
SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in query to GEQRF Lapack routine %d",(int)lierr); 6127984c4197SStefano Zampini ierr = PetscBLASIntCast((PetscInt)PetscRealPart(lqr_work_t),&lqr_work);CHKERRQ(ierr); 6128785e854fSJed Brown ierr = PetscMalloc1((PetscInt)PetscRealPart(lqr_work_t),&qr_work);CHKERRQ(ierr); 6129984c4197SStefano Zampini lgqr_work = -1; 61303f08241aSStefano Zampini ierr = PetscBLASIntCast(max_size_of_constraint,&Blas_M);CHKERRQ(ierr); 61313f08241aSStefano Zampini ierr = PetscBLASIntCast(max_size_of_constraint,&Blas_N);CHKERRQ(ierr); 61323f08241aSStefano Zampini ierr = PetscBLASIntCast(max_constraints,&Blas_K);CHKERRQ(ierr); 61333f08241aSStefano Zampini ierr = PetscBLASIntCast(max_size_of_constraint,&Blas_LDA);CHKERRQ(ierr); 61343f08241aSStefano Zampini if (Blas_K>Blas_M) Blas_K=Blas_M; /* adjust just for computing optimal work */ 61353f08241aSStefano Zampini PetscStackCallBLAS("LAPACKungqr",LAPACKungqr_(&Blas_M,&Blas_N,&Blas_K,qr_basis,&Blas_LDA,qr_tau,&lgqr_work_t,&lgqr_work,&lierr)); 6136984c4197SStefano Zampini if (lierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in query to UNGQR Lapack routine %d",(int)lierr); 6137984c4197SStefano Zampini ierr = PetscBLASIntCast((PetscInt)PetscRealPart(lgqr_work_t),&lgqr_work);CHKERRQ(ierr); 6138785e854fSJed Brown ierr = PetscMalloc1((PetscInt)PetscRealPart(lgqr_work_t),&gqr_work);CHKERRQ(ierr); 6139984c4197SStefano Zampini /* array to store rhs and solution of triangular solver */ 6140785e854fSJed Brown ierr = PetscMalloc1(max_constraints*max_constraints,&trs_rhs);CHKERRQ(ierr); 6141a717540cSStefano Zampini /* allocating workspace for check */ 6142a717540cSStefano Zampini if (pcbddc->dbg_flag) { 6143cf5a6209SStefano Zampini ierr = PetscMalloc1(max_size_of_constraint*(max_constraints+max_size_of_constraint),&dbg_work);CHKERRQ(ierr); 6144a717540cSStefano Zampini } 6145a717540cSStefano Zampini } 6146984c4197SStefano Zampini /* array to store whether a node is primal or not */ 61474641a718SStefano Zampini 
ierr = PetscBTCreate(pcis->n_B,&is_primal);CHKERRQ(ierr); 6148473ba861SJed Brown ierr = PetscMalloc1(total_primal_vertices,&aux_primal_numbering_B);CHKERRQ(ierr); 61490e6343abSStefano Zampini ierr = ISGlobalToLocalMappingApply(pcis->BtoNmap,IS_GTOLM_DROP,total_primal_vertices,pcbddc->local_primal_ref_node,&i,aux_primal_numbering_B);CHKERRQ(ierr); 6150eee23b56SStefano Zampini if (i != total_primal_vertices) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Error in boundary numbering for BDDC vertices! %D != %D\n",total_primal_vertices,i); 615139e2fb2aSStefano Zampini for (i=0;i<total_primal_vertices;i++) { 615239e2fb2aSStefano Zampini ierr = PetscBTSet(is_primal,aux_primal_numbering_B[i]);CHKERRQ(ierr); 615339e2fb2aSStefano Zampini } 615439e2fb2aSStefano Zampini ierr = PetscFree(aux_primal_numbering_B);CHKERRQ(ierr); 6155984c4197SStefano Zampini 6156a717540cSStefano Zampini /* loop on constraints and see whether or not they need a change of basis and compute it */ 61579162d606SStefano Zampini for (total_counts=n_vertices;total_counts<total_counts_cc;total_counts++) { 61589162d606SStefano Zampini size_of_constraint = constraints_idxs_ptr[total_counts+1]-constraints_idxs_ptr[total_counts]; 61594641a718SStefano Zampini if (PetscBTLookup(change_basis,total_counts)) { 6160984c4197SStefano Zampini /* get constraint info */ 61619162d606SStefano Zampini primal_dofs = constraints_n[total_counts]; 6162984c4197SStefano Zampini dual_dofs = size_of_constraint-primal_dofs; 6163984c4197SStefano Zampini 6164984c4197SStefano Zampini if (pcbddc->dbg_flag) { 61659162d606SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"Constraints %d: %d need a change of basis (size %d)\n",total_counts,primal_dofs,size_of_constraint);CHKERRQ(ierr); 6166674ae819SStefano Zampini } 6167984c4197SStefano Zampini 6168fa434743SStefano Zampini if (PetscBTLookup(qr_needed_idx,total_counts)) { /* QR */ 6169a717540cSStefano Zampini 6170a717540cSStefano Zampini /* copy quadrature constraints 
for change of basis check */ 6171a717540cSStefano Zampini if (pcbddc->dbg_flag) { 61729162d606SStefano Zampini ierr = PetscMemcpy(dbg_work,&constraints_data[constraints_data_ptr[total_counts]],size_of_constraint*primal_dofs*sizeof(PetscScalar));CHKERRQ(ierr); 6173a717540cSStefano Zampini } 6174984c4197SStefano Zampini /* copy temporary constraints into larger work vector (in order to store all columns of Q) */ 61759162d606SStefano Zampini ierr = PetscMemcpy(qr_basis,&constraints_data[constraints_data_ptr[total_counts]],size_of_constraint*primal_dofs*sizeof(PetscScalar));CHKERRQ(ierr); 6176984c4197SStefano Zampini 6177984c4197SStefano Zampini /* compute QR decomposition of constraints */ 61783f08241aSStefano Zampini ierr = PetscBLASIntCast(size_of_constraint,&Blas_M);CHKERRQ(ierr); 61793f08241aSStefano Zampini ierr = PetscBLASIntCast(primal_dofs,&Blas_N);CHKERRQ(ierr); 61803f08241aSStefano Zampini ierr = PetscBLASIntCast(size_of_constraint,&Blas_LDA);CHKERRQ(ierr); 6181674ae819SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 61823f08241aSStefano Zampini PetscStackCallBLAS("LAPACKgeqrf",LAPACKgeqrf_(&Blas_M,&Blas_N,qr_basis,&Blas_LDA,qr_tau,qr_work,&lqr_work,&lierr)); 6183984c4197SStefano Zampini if (lierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in GEQRF Lapack routine %d",(int)lierr); 6184674ae819SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 6185984c4197SStefano Zampini 6186984c4197SStefano Zampini /* explictly compute R^-T */ 6187984c4197SStefano Zampini ierr = PetscMemzero(trs_rhs,primal_dofs*primal_dofs*sizeof(*trs_rhs));CHKERRQ(ierr); 6188984c4197SStefano Zampini for (j=0;j<primal_dofs;j++) trs_rhs[j*(primal_dofs+1)] = 1.0; 61893f08241aSStefano Zampini ierr = PetscBLASIntCast(primal_dofs,&Blas_N);CHKERRQ(ierr); 61903f08241aSStefano Zampini ierr = PetscBLASIntCast(primal_dofs,&Blas_NRHS);CHKERRQ(ierr); 61913f08241aSStefano Zampini ierr = PetscBLASIntCast(size_of_constraint,&Blas_LDA);CHKERRQ(ierr); 61923f08241aSStefano 
Zampini ierr = PetscBLASIntCast(primal_dofs,&Blas_LDB);CHKERRQ(ierr); 6193984c4197SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 61943f08241aSStefano Zampini PetscStackCallBLAS("LAPACKtrtrs",LAPACKtrtrs_("U","T","N",&Blas_N,&Blas_NRHS,qr_basis,&Blas_LDA,trs_rhs,&Blas_LDB,&lierr)); 6195984c4197SStefano Zampini if (lierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in TRTRS Lapack routine %d",(int)lierr); 6196984c4197SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 6197984c4197SStefano Zampini 6198a717540cSStefano Zampini /* explicitly compute all columns of Q (Q = [Q1 | Q2] ) overwriting QR factorization in qr_basis */ 61993f08241aSStefano Zampini ierr = PetscBLASIntCast(size_of_constraint,&Blas_M);CHKERRQ(ierr); 62003f08241aSStefano Zampini ierr = PetscBLASIntCast(size_of_constraint,&Blas_N);CHKERRQ(ierr); 62013f08241aSStefano Zampini ierr = PetscBLASIntCast(primal_dofs,&Blas_K);CHKERRQ(ierr); 62023f08241aSStefano Zampini ierr = PetscBLASIntCast(size_of_constraint,&Blas_LDA);CHKERRQ(ierr); 6203984c4197SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 62043f08241aSStefano Zampini PetscStackCallBLAS("LAPACKungqr",LAPACKungqr_(&Blas_M,&Blas_N,&Blas_K,qr_basis,&Blas_LDA,qr_tau,gqr_work,&lgqr_work,&lierr)); 6205984c4197SStefano Zampini if (lierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in UNGQR Lapack routine %d",(int)lierr); 6206984c4197SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 6207984c4197SStefano Zampini 6208984c4197SStefano Zampini /* first primal_dofs columns of Q need to be re-scaled in order to be unitary w.r.t constraints 6209984c4197SStefano Zampini i.e. C_{pxn}*Q_{nxn} should be equal to [I_pxp | 0_pxd] (see check below) 6210984c4197SStefano Zampini where n=size_of_constraint, p=primal_dofs, d=dual_dofs (n=p+d), I and 0 identity and null matrix resp. 
*/ 62113f08241aSStefano Zampini ierr = PetscBLASIntCast(size_of_constraint,&Blas_M);CHKERRQ(ierr); 62123f08241aSStefano Zampini ierr = PetscBLASIntCast(primal_dofs,&Blas_N);CHKERRQ(ierr); 62133f08241aSStefano Zampini ierr = PetscBLASIntCast(primal_dofs,&Blas_K);CHKERRQ(ierr); 62143f08241aSStefano Zampini ierr = PetscBLASIntCast(size_of_constraint,&Blas_LDA);CHKERRQ(ierr); 62153f08241aSStefano Zampini ierr = PetscBLASIntCast(primal_dofs,&Blas_LDB);CHKERRQ(ierr); 62163f08241aSStefano Zampini ierr = PetscBLASIntCast(size_of_constraint,&Blas_LDC);CHKERRQ(ierr); 6217984c4197SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 62189162d606SStefano Zampini PetscStackCallBLAS("BLASgemm",BLASgemm_("N","N",&Blas_M,&Blas_N,&Blas_K,&one,qr_basis,&Blas_LDA,trs_rhs,&Blas_LDB,&zero,constraints_data+constraints_data_ptr[total_counts],&Blas_LDC)); 6219984c4197SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 62209162d606SStefano Zampini ierr = PetscMemcpy(qr_basis,&constraints_data[constraints_data_ptr[total_counts]],size_of_constraint*primal_dofs*sizeof(PetscScalar));CHKERRQ(ierr); 6221984c4197SStefano Zampini 6222984c4197SStefano Zampini /* insert values in change of basis matrix respecting global ordering of new primal dofs */ 62239162d606SStefano Zampini start_rows = &constraints_idxs[constraints_idxs_ptr[total_counts]]; 6224984c4197SStefano Zampini /* insert cols for primal dofs */ 6225984c4197SStefano Zampini for (j=0;j<primal_dofs;j++) { 6226984c4197SStefano Zampini start_vals = &qr_basis[j*size_of_constraint]; 62279162d606SStefano Zampini start_cols = &constraints_idxs[constraints_idxs_ptr[total_counts]+j]; 6228906d46d4SStefano Zampini ierr = MatSetValues(localChangeOfBasisMatrix,size_of_constraint,start_rows,1,start_cols,start_vals,INSERT_VALUES);CHKERRQ(ierr); 6229984c4197SStefano Zampini } 6230984c4197SStefano Zampini /* insert cols for dual dofs */ 6231984c4197SStefano Zampini for (j=0,k=0;j<dual_dofs;k++) { 62329162d606SStefano Zampini if 
(!PetscBTLookup(is_primal,constraints_idxs_B[constraints_idxs_ptr[total_counts]+k])) { 6233984c4197SStefano Zampini start_vals = &qr_basis[(primal_dofs+j)*size_of_constraint]; 62349162d606SStefano Zampini start_cols = &constraints_idxs[constraints_idxs_ptr[total_counts]+k]; 6235906d46d4SStefano Zampini ierr = MatSetValues(localChangeOfBasisMatrix,size_of_constraint,start_rows,1,start_cols,start_vals,INSERT_VALUES);CHKERRQ(ierr); 6236984c4197SStefano Zampini j++; 6237674ae819SStefano Zampini } 6238674ae819SStefano Zampini } 6239984c4197SStefano Zampini 6240984c4197SStefano Zampini /* check change of basis */ 6241984c4197SStefano Zampini if (pcbddc->dbg_flag) { 6242984c4197SStefano Zampini PetscInt ii,jj; 6243984c4197SStefano Zampini PetscBool valid_qr=PETSC_TRUE; 6244c4303822SStefano Zampini ierr = PetscBLASIntCast(primal_dofs,&Blas_M);CHKERRQ(ierr); 6245c4303822SStefano Zampini ierr = PetscBLASIntCast(size_of_constraint,&Blas_N);CHKERRQ(ierr); 6246c4303822SStefano Zampini ierr = PetscBLASIntCast(size_of_constraint,&Blas_K);CHKERRQ(ierr); 6247c4303822SStefano Zampini ierr = PetscBLASIntCast(size_of_constraint,&Blas_LDA);CHKERRQ(ierr); 6248c4303822SStefano Zampini ierr = PetscBLASIntCast(size_of_constraint,&Blas_LDB);CHKERRQ(ierr); 6249c4303822SStefano Zampini ierr = PetscBLASIntCast(primal_dofs,&Blas_LDC);CHKERRQ(ierr); 6250984c4197SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 6251cf5a6209SStefano Zampini PetscStackCallBLAS("BLASgemm",BLASgemm_("T","N",&Blas_M,&Blas_N,&Blas_K,&one,dbg_work,&Blas_LDA,qr_basis,&Blas_LDB,&zero,&dbg_work[size_of_constraint*primal_dofs],&Blas_LDC)); 6252984c4197SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 6253984c4197SStefano Zampini for (jj=0;jj<size_of_constraint;jj++) { 6254984c4197SStefano Zampini for (ii=0;ii<primal_dofs;ii++) { 6255cf5a6209SStefano Zampini if (ii != jj && PetscAbsScalar(dbg_work[size_of_constraint*primal_dofs+jj*primal_dofs+ii]) > 1.e-12) valid_qr = PETSC_FALSE; 
6256cf5a6209SStefano Zampini if (ii == jj && PetscAbsScalar(dbg_work[size_of_constraint*primal_dofs+jj*primal_dofs+ii]-1.0) > 1.e-12) valid_qr = PETSC_FALSE; 6257674ae819SStefano Zampini } 6258674ae819SStefano Zampini } 6259984c4197SStefano Zampini if (!valid_qr) { 626022d5777bSStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"\t-> wrong change of basis!\n");CHKERRQ(ierr); 6261984c4197SStefano Zampini for (jj=0;jj<size_of_constraint;jj++) { 6262984c4197SStefano Zampini for (ii=0;ii<primal_dofs;ii++) { 6263cf5a6209SStefano Zampini if (ii != jj && PetscAbsScalar(dbg_work[size_of_constraint*primal_dofs+jj*primal_dofs+ii]) > 1.e-12) { 6264cf5a6209SStefano Zampini PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"\tQr basis function %d is not orthogonal to constraint %d (%1.14e)!\n",jj,ii,PetscAbsScalar(dbg_work[size_of_constraint*primal_dofs+jj*primal_dofs+ii])); 6265674ae819SStefano Zampini } 6266cf5a6209SStefano Zampini if (ii == jj && PetscAbsScalar(dbg_work[size_of_constraint*primal_dofs+jj*primal_dofs+ii]-1.0) > 1.e-12) { 6267cf5a6209SStefano Zampini PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"\tQr basis function %d is not unitary w.r.t constraint %d (%1.14e)!\n",jj,ii,PetscAbsScalar(dbg_work[size_of_constraint*primal_dofs+jj*primal_dofs+ii])); 6268984c4197SStefano Zampini } 6269984c4197SStefano Zampini } 6270984c4197SStefano Zampini } 6271674ae819SStefano Zampini } else { 627222d5777bSStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"\t-> right change of basis!\n");CHKERRQ(ierr); 6273674ae819SStefano Zampini } 6274674ae819SStefano Zampini } 6275a717540cSStefano Zampini } else { /* simple transformation block */ 6276a717540cSStefano Zampini PetscInt row,col; 6277a6b551f4SStefano Zampini PetscScalar val,norm; 6278a6b551f4SStefano Zampini 6279a6b551f4SStefano Zampini ierr = PetscBLASIntCast(size_of_constraint,&Blas_N);CHKERRQ(ierr); 62809162d606SStefano Zampini PetscStackCallBLAS("BLASdot",norm 
= BLASdot_(&Blas_N,constraints_data+constraints_data_ptr[total_counts],&Blas_one,constraints_data+constraints_data_ptr[total_counts],&Blas_one)); 6281a717540cSStefano Zampini for (j=0;j<size_of_constraint;j++) { 62829162d606SStefano Zampini PetscInt row_B = constraints_idxs_B[constraints_idxs_ptr[total_counts]+j]; 62839162d606SStefano Zampini row = constraints_idxs[constraints_idxs_ptr[total_counts]+j]; 6284bbb9e6c6SStefano Zampini if (!PetscBTLookup(is_primal,row_B)) { 62859162d606SStefano Zampini col = constraints_idxs[constraints_idxs_ptr[total_counts]]; 6286906d46d4SStefano Zampini ierr = MatSetValue(localChangeOfBasisMatrix,row,row,1.0,INSERT_VALUES);CHKERRQ(ierr); 62879162d606SStefano Zampini ierr = MatSetValue(localChangeOfBasisMatrix,row,col,constraints_data[constraints_data_ptr[total_counts]+j]/norm,INSERT_VALUES);CHKERRQ(ierr); 6288a717540cSStefano Zampini } else { 6289a717540cSStefano Zampini for (k=0;k<size_of_constraint;k++) { 62909162d606SStefano Zampini col = constraints_idxs[constraints_idxs_ptr[total_counts]+k]; 6291a717540cSStefano Zampini if (row != col) { 62929162d606SStefano Zampini val = -constraints_data[constraints_data_ptr[total_counts]+k]/constraints_data[constraints_data_ptr[total_counts]]; 6293a717540cSStefano Zampini } else { 62949162d606SStefano Zampini val = constraints_data[constraints_data_ptr[total_counts]]/norm; 6295a717540cSStefano Zampini } 6296906d46d4SStefano Zampini ierr = MatSetValue(localChangeOfBasisMatrix,row,col,val,INSERT_VALUES);CHKERRQ(ierr); 6297a717540cSStefano Zampini } 6298a717540cSStefano Zampini } 6299a717540cSStefano Zampini } 630098a51de6SStefano Zampini if (pcbddc->dbg_flag) { 630122d5777bSStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"\t-> using standard change of basis\n");CHKERRQ(ierr); 6302a717540cSStefano Zampini } 6303674ae819SStefano Zampini } 6304984c4197SStefano Zampini } else { 6305984c4197SStefano Zampini if (pcbddc->dbg_flag) { 63069162d606SStefano Zampini ierr = 
PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"Constraint %d does not need a change of basis (size %d)\n",total_counts,size_of_constraint);CHKERRQ(ierr); 6307674ae819SStefano Zampini } 6308674ae819SStefano Zampini } 6309674ae819SStefano Zampini } 6310a717540cSStefano Zampini 6311a717540cSStefano Zampini /* free workspace */ 6312a717540cSStefano Zampini if (qr_needed) { 6313984c4197SStefano Zampini if (pcbddc->dbg_flag) { 6314cf5a6209SStefano Zampini ierr = PetscFree(dbg_work);CHKERRQ(ierr); 6315984c4197SStefano Zampini } 6316984c4197SStefano Zampini ierr = PetscFree(trs_rhs);CHKERRQ(ierr); 6317984c4197SStefano Zampini ierr = PetscFree(qr_tau);CHKERRQ(ierr); 6318984c4197SStefano Zampini ierr = PetscFree(qr_work);CHKERRQ(ierr); 6319984c4197SStefano Zampini ierr = PetscFree(gqr_work);CHKERRQ(ierr); 6320984c4197SStefano Zampini ierr = PetscFree(qr_basis);CHKERRQ(ierr); 6321674ae819SStefano Zampini } 6322a717540cSStefano Zampini ierr = PetscBTDestroy(&is_primal);CHKERRQ(ierr); 6323906d46d4SStefano Zampini ierr = MatAssemblyBegin(localChangeOfBasisMatrix,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 6324906d46d4SStefano Zampini ierr = MatAssemblyEnd(localChangeOfBasisMatrix,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 6325906d46d4SStefano Zampini 6326906d46d4SStefano Zampini /* assembling of global change of variable */ 632788c03ad3SStefano Zampini if (!pcbddc->fake_change) { 6328bbb9e6c6SStefano Zampini Mat tmat; 632916f15bc4SStefano Zampini PetscInt bs; 633016f15bc4SStefano Zampini 6331906d46d4SStefano Zampini ierr = VecGetSize(pcis->vec1_global,&global_size);CHKERRQ(ierr); 6332906d46d4SStefano Zampini ierr = VecGetLocalSize(pcis->vec1_global,&local_size);CHKERRQ(ierr); 6333bbb9e6c6SStefano Zampini ierr = MatDuplicate(pc->pmat,MAT_DO_NOT_COPY_VALUES,&tmat);CHKERRQ(ierr); 6334bbb9e6c6SStefano Zampini ierr = MatISSetLocalMat(tmat,localChangeOfBasisMatrix);CHKERRQ(ierr); 6335bbb9e6c6SStefano Zampini ierr = 
MatCreate(PetscObjectComm((PetscObject)pc),&pcbddc->ChangeOfBasisMatrix);CHKERRQ(ierr); 6336bbb9e6c6SStefano Zampini ierr = MatSetType(pcbddc->ChangeOfBasisMatrix,MATAIJ);CHKERRQ(ierr); 633716f15bc4SStefano Zampini ierr = MatGetBlockSize(pc->pmat,&bs);CHKERRQ(ierr); 633816f15bc4SStefano Zampini ierr = MatSetBlockSize(pcbddc->ChangeOfBasisMatrix,bs);CHKERRQ(ierr); 6339906d46d4SStefano Zampini ierr = MatSetSizes(pcbddc->ChangeOfBasisMatrix,local_size,local_size,global_size,global_size);CHKERRQ(ierr); 6340bbb9e6c6SStefano Zampini ierr = MatISSetMPIXAIJPreallocation_Private(tmat,pcbddc->ChangeOfBasisMatrix,PETSC_TRUE);CHKERRQ(ierr); 6341bbb9e6c6SStefano Zampini ierr = MatISGetMPIXAIJ(tmat,MAT_REUSE_MATRIX,&pcbddc->ChangeOfBasisMatrix);CHKERRQ(ierr); 6342bbb9e6c6SStefano Zampini ierr = MatDestroy(&tmat);CHKERRQ(ierr); 6343bbb9e6c6SStefano Zampini ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr); 6344bbb9e6c6SStefano Zampini ierr = VecSet(pcis->vec1_N,1.0);CHKERRQ(ierr); 6345e176bc59SStefano Zampini ierr = VecScatterBegin(matis->rctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 6346e176bc59SStefano Zampini ierr = VecScatterEnd(matis->rctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 6347bbb9e6c6SStefano Zampini ierr = VecReciprocal(pcis->vec1_global);CHKERRQ(ierr); 6348bbb9e6c6SStefano Zampini ierr = MatDiagonalScale(pcbddc->ChangeOfBasisMatrix,pcis->vec1_global,NULL);CHKERRQ(ierr); 634988c03ad3SStefano Zampini 6350906d46d4SStefano Zampini /* check */ 6351906d46d4SStefano Zampini if (pcbddc->dbg_flag) { 6352906d46d4SStefano Zampini PetscReal error; 6353906d46d4SStefano Zampini Vec x,x_change; 6354906d46d4SStefano Zampini 6355906d46d4SStefano Zampini ierr = VecDuplicate(pcis->vec1_global,&x);CHKERRQ(ierr); 6356906d46d4SStefano Zampini ierr = VecDuplicate(pcis->vec1_global,&x_change);CHKERRQ(ierr); 6357906d46d4SStefano Zampini ierr = VecSetRandom(x,NULL);CHKERRQ(ierr); 6358906d46d4SStefano Zampini ierr = 
VecCopy(x,pcis->vec1_global);CHKERRQ(ierr); 6359e176bc59SStefano Zampini ierr = VecScatterBegin(matis->rctx,x,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 6360e176bc59SStefano Zampini ierr = VecScatterEnd(matis->rctx,x,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 6361bbb9e6c6SStefano Zampini ierr = MatMult(localChangeOfBasisMatrix,pcis->vec1_N,pcis->vec2_N);CHKERRQ(ierr); 6362e176bc59SStefano Zampini ierr = VecScatterBegin(matis->rctx,pcis->vec2_N,x,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 6363e176bc59SStefano Zampini ierr = VecScatterEnd(matis->rctx,pcis->vec2_N,x,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 6364906d46d4SStefano Zampini ierr = MatMult(pcbddc->ChangeOfBasisMatrix,pcis->vec1_global,x_change);CHKERRQ(ierr); 6365906d46d4SStefano Zampini ierr = VecAXPY(x,-1.0,x_change);CHKERRQ(ierr); 6366906d46d4SStefano Zampini ierr = VecNorm(x,NORM_INFINITY,&error);CHKERRQ(ierr); 6367637e8532SStefano Zampini if (error > PETSC_SMALL) { 6368637e8532SStefano Zampini SETERRQ1(PetscObjectComm((PetscObject)pc),PETSC_ERR_PLIB,"Error global vs local change on N: %1.6e\n",error); 6369637e8532SStefano Zampini } 6370906d46d4SStefano Zampini ierr = VecDestroy(&x);CHKERRQ(ierr); 6371906d46d4SStefano Zampini ierr = VecDestroy(&x_change);CHKERRQ(ierr); 6372906d46d4SStefano Zampini } 6373b96c3477SStefano Zampini /* adapt sub_schurs computed (if any) */ 6374b96c3477SStefano Zampini if (pcbddc->use_deluxe_scaling) { 6375b96c3477SStefano Zampini PCBDDCSubSchurs sub_schurs=pcbddc->sub_schurs; 6376bf3a8328SStefano Zampini 63779a962809SStefano Zampini if (pcbddc->use_change_of_basis && pcbddc->adaptive_userdefined) SETERRQ(PetscObjectComm((PetscObject)pc),PETSC_ERR_SUP,"Cannot mix automatic change of basis, adaptive selection and user-defined constraints");CHKERRQ(ierr); 6378b334f244SStefano Zampini if (sub_schurs && sub_schurs->S_Ej_all) { 6379ac632422SStefano Zampini Mat S_new,tmat; 6380bf3a8328SStefano Zampini IS is_all_N,is_V_Sall = NULL; 
6381bbb9e6c6SStefano Zampini 6382bbb9e6c6SStefano Zampini ierr = ISLocalToGlobalMappingApplyIS(pcis->BtoNmap,sub_schurs->is_Ej_all,&is_all_N);CHKERRQ(ierr); 63837dae84e0SHong Zhang ierr = MatCreateSubMatrix(localChangeOfBasisMatrix,is_all_N,is_all_N,MAT_INITIAL_MATRIX,&tmat);CHKERRQ(ierr); 6384bf3a8328SStefano Zampini if (pcbddc->deluxe_zerorows) { 6385bf3a8328SStefano Zampini ISLocalToGlobalMapping NtoSall; 6386bf3a8328SStefano Zampini IS is_V; 6387b087196eSStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,pcbddc->n_vertices,pcbddc->local_primal_ref_node,PETSC_COPY_VALUES,&is_V);CHKERRQ(ierr); 6388b087196eSStefano Zampini ierr = ISLocalToGlobalMappingCreateIS(is_all_N,&NtoSall);CHKERRQ(ierr); 6389b087196eSStefano Zampini ierr = ISGlobalToLocalMappingApplyIS(NtoSall,IS_GTOLM_DROP,is_V,&is_V_Sall);CHKERRQ(ierr); 6390b087196eSStefano Zampini ierr = ISLocalToGlobalMappingDestroy(&NtoSall);CHKERRQ(ierr); 6391b087196eSStefano Zampini ierr = ISDestroy(&is_V);CHKERRQ(ierr); 6392bf3a8328SStefano Zampini } 6393bf3a8328SStefano Zampini ierr = ISDestroy(&is_all_N);CHKERRQ(ierr); 6394ac632422SStefano Zampini ierr = MatPtAP(sub_schurs->S_Ej_all,tmat,MAT_INITIAL_MATRIX,1.0,&S_new);CHKERRQ(ierr); 6395b96c3477SStefano Zampini ierr = MatDestroy(&sub_schurs->S_Ej_all);CHKERRQ(ierr); 6396ac632422SStefano Zampini ierr = PetscObjectReference((PetscObject)S_new);CHKERRQ(ierr); 6397bf3a8328SStefano Zampini if (pcbddc->deluxe_zerorows) { 6398bf3a8328SStefano Zampini const PetscScalar *array; 6399bf3a8328SStefano Zampini const PetscInt *idxs_V,*idxs_all; 6400bf3a8328SStefano Zampini PetscInt i,n_V; 6401bf3a8328SStefano Zampini 6402b087196eSStefano Zampini ierr = MatZeroRowsColumnsIS(S_new,is_V_Sall,1.,NULL,NULL);CHKERRQ(ierr); 6403b087196eSStefano Zampini ierr = ISGetLocalSize(is_V_Sall,&n_V);CHKERRQ(ierr); 6404b087196eSStefano Zampini ierr = ISGetIndices(is_V_Sall,&idxs_V);CHKERRQ(ierr); 6405b087196eSStefano Zampini ierr = ISGetIndices(sub_schurs->is_Ej_all,&idxs_all);CHKERRQ(ierr); 
6406b087196eSStefano Zampini ierr = VecGetArrayRead(pcis->D,&array);CHKERRQ(ierr); 6407b087196eSStefano Zampini for (i=0;i<n_V;i++) { 6408b087196eSStefano Zampini PetscScalar val; 6409b087196eSStefano Zampini PetscInt idx; 6410b087196eSStefano Zampini 6411b087196eSStefano Zampini idx = idxs_V[i]; 6412b087196eSStefano Zampini val = array[idxs_all[idxs_V[i]]]; 6413b087196eSStefano Zampini ierr = MatSetValue(S_new,idx,idx,val,INSERT_VALUES);CHKERRQ(ierr); 6414b087196eSStefano Zampini } 6415b087196eSStefano Zampini ierr = MatAssemblyBegin(S_new,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 6416b087196eSStefano Zampini ierr = MatAssemblyEnd(S_new,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 6417bf3a8328SStefano Zampini ierr = VecRestoreArrayRead(pcis->D,&array);CHKERRQ(ierr); 6418bf3a8328SStefano Zampini ierr = ISRestoreIndices(sub_schurs->is_Ej_all,&idxs_all);CHKERRQ(ierr); 6419bf3a8328SStefano Zampini ierr = ISRestoreIndices(is_V_Sall,&idxs_V);CHKERRQ(ierr); 6420bf3a8328SStefano Zampini } 6421ac632422SStefano Zampini sub_schurs->S_Ej_all = S_new; 6422ac632422SStefano Zampini ierr = MatDestroy(&S_new);CHKERRQ(ierr); 6423ac632422SStefano Zampini if (sub_schurs->sum_S_Ej_all) { 6424ac632422SStefano Zampini ierr = MatPtAP(sub_schurs->sum_S_Ej_all,tmat,MAT_INITIAL_MATRIX,1.0,&S_new);CHKERRQ(ierr); 6425b96c3477SStefano Zampini ierr = MatDestroy(&sub_schurs->sum_S_Ej_all);CHKERRQ(ierr); 6426ac632422SStefano Zampini ierr = PetscObjectReference((PetscObject)S_new);CHKERRQ(ierr); 6427bf3a8328SStefano Zampini if (pcbddc->deluxe_zerorows) { 6428b087196eSStefano Zampini ierr = MatZeroRowsColumnsIS(S_new,is_V_Sall,1.,NULL,NULL);CHKERRQ(ierr); 6429bf3a8328SStefano Zampini } 6430ac632422SStefano Zampini sub_schurs->sum_S_Ej_all = S_new; 6431ac632422SStefano Zampini ierr = MatDestroy(&S_new);CHKERRQ(ierr); 6432ac632422SStefano Zampini } 6433b087196eSStefano Zampini ierr = ISDestroy(&is_V_Sall);CHKERRQ(ierr); 643488c03ad3SStefano Zampini ierr = MatDestroy(&tmat);CHKERRQ(ierr); 6435b96c3477SStefano Zampini 
} 6436c9db6a07SStefano Zampini /* destroy any change of basis context in sub_schurs */ 6437b334f244SStefano Zampini if (sub_schurs && sub_schurs->change) { 6438c9db6a07SStefano Zampini PetscInt i; 6439c9db6a07SStefano Zampini 6440c9db6a07SStefano Zampini for (i=0;i<sub_schurs->n_subs;i++) { 6441c9db6a07SStefano Zampini ierr = KSPDestroy(&sub_schurs->change[i]);CHKERRQ(ierr); 6442c9db6a07SStefano Zampini } 6443c9db6a07SStefano Zampini ierr = PetscFree(sub_schurs->change);CHKERRQ(ierr); 6444c9db6a07SStefano Zampini } 6445b96c3477SStefano Zampini } 644616909a7fSStefano Zampini if (pcbddc->switch_static) { /* need to save the local change */ 644716909a7fSStefano Zampini pcbddc->switch_static_change = localChangeOfBasisMatrix; 644816909a7fSStefano Zampini } else { 6449906d46d4SStefano Zampini ierr = MatDestroy(&localChangeOfBasisMatrix);CHKERRQ(ierr); 645016909a7fSStefano Zampini } 64511dd7afcfSStefano Zampini /* determine if any process has changed the pressures locally */ 645227b6a85dSStefano Zampini pcbddc->change_interior = pcbddc->benign_have_null; 645372b8c272SStefano Zampini } else { /* fake change (get back change of basis into ConstraintMatrix and info on qr) */ 645472b8c272SStefano Zampini ierr = MatDestroy(&pcbddc->ConstraintMatrix);CHKERRQ(ierr); 645572b8c272SStefano Zampini pcbddc->ConstraintMatrix = localChangeOfBasisMatrix; 645672b8c272SStefano Zampini pcbddc->use_qr_single = qr_needed; 645772b8c272SStefano Zampini } 64581dd7afcfSStefano Zampini } else if (pcbddc->user_ChangeOfBasisMatrix || pcbddc->benign_saddle_point) { 645927b6a85dSStefano Zampini if (!pcbddc->benign_have_null && pcbddc->user_ChangeOfBasisMatrix) { 6460b9b85e73SStefano Zampini ierr = PetscObjectReference((PetscObject)pcbddc->user_ChangeOfBasisMatrix);CHKERRQ(ierr); 6461b9b85e73SStefano Zampini pcbddc->ChangeOfBasisMatrix = pcbddc->user_ChangeOfBasisMatrix; 6462906d46d4SStefano Zampini } else { 64631dd7afcfSStefano Zampini Mat benign_global = NULL; 646427b6a85dSStefano Zampini if 
(pcbddc->benign_have_null) { 64651dd7afcfSStefano Zampini Mat tmat; 64661dd7afcfSStefano Zampini 64671dd7afcfSStefano Zampini pcbddc->change_interior = PETSC_TRUE; 64681dd7afcfSStefano Zampini ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr); 64691dd7afcfSStefano Zampini ierr = VecSet(pcis->vec1_N,1.0);CHKERRQ(ierr); 64701dd7afcfSStefano Zampini ierr = VecScatterBegin(matis->rctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 64711dd7afcfSStefano Zampini ierr = VecScatterEnd(matis->rctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 64721dd7afcfSStefano Zampini ierr = VecReciprocal(pcis->vec1_global);CHKERRQ(ierr); 64731dd7afcfSStefano Zampini ierr = VecScatterBegin(matis->rctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 64741dd7afcfSStefano Zampini ierr = VecScatterEnd(matis->rctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 64751dd7afcfSStefano Zampini ierr = MatDuplicate(pc->pmat,MAT_DO_NOT_COPY_VALUES,&tmat);CHKERRQ(ierr); 64761dd7afcfSStefano Zampini if (pcbddc->benign_change) { 64771dd7afcfSStefano Zampini Mat M; 64781dd7afcfSStefano Zampini 64791dd7afcfSStefano Zampini ierr = MatDuplicate(pcbddc->benign_change,MAT_COPY_VALUES,&M);CHKERRQ(ierr); 64801dd7afcfSStefano Zampini ierr = MatDiagonalScale(M,pcis->vec1_N,NULL);CHKERRQ(ierr); 64811dd7afcfSStefano Zampini ierr = MatISSetLocalMat(tmat,M);CHKERRQ(ierr); 64821dd7afcfSStefano Zampini ierr = MatDestroy(&M);CHKERRQ(ierr); 6483906d46d4SStefano Zampini } else { 64841dd7afcfSStefano Zampini Mat eye; 64851dd7afcfSStefano Zampini PetscScalar *array; 64861dd7afcfSStefano Zampini 64871dd7afcfSStefano Zampini ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 64881dd7afcfSStefano Zampini ierr = MatCreateSeqAIJ(PETSC_COMM_SELF,pcis->n,pcis->n,1,NULL,&eye);CHKERRQ(ierr); 64891dd7afcfSStefano Zampini for (i=0;i<pcis->n;i++) { 64901dd7afcfSStefano Zampini ierr = 
MatSetValue(eye,i,i,array[i],INSERT_VALUES);CHKERRQ(ierr); 6491906d46d4SStefano Zampini } 64921dd7afcfSStefano Zampini ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 64931dd7afcfSStefano Zampini ierr = MatAssemblyBegin(eye,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 64941dd7afcfSStefano Zampini ierr = MatAssemblyEnd(eye,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 64951dd7afcfSStefano Zampini ierr = MatISSetLocalMat(tmat,eye);CHKERRQ(ierr); 64961dd7afcfSStefano Zampini ierr = MatDestroy(&eye);CHKERRQ(ierr); 64971dd7afcfSStefano Zampini } 64981dd7afcfSStefano Zampini ierr = MatISGetMPIXAIJ(tmat,MAT_INITIAL_MATRIX,&benign_global);CHKERRQ(ierr); 64991dd7afcfSStefano Zampini ierr = MatDestroy(&tmat);CHKERRQ(ierr); 65001dd7afcfSStefano Zampini } 65011dd7afcfSStefano Zampini if (pcbddc->user_ChangeOfBasisMatrix) { 65021dd7afcfSStefano Zampini ierr = MatMatMult(pcbddc->user_ChangeOfBasisMatrix,benign_global,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&pcbddc->ChangeOfBasisMatrix);CHKERRQ(ierr); 65031dd7afcfSStefano Zampini ierr = MatDestroy(&benign_global);CHKERRQ(ierr); 650427b6a85dSStefano Zampini } else if (pcbddc->benign_have_null) { 65051dd7afcfSStefano Zampini pcbddc->ChangeOfBasisMatrix = benign_global; 65061dd7afcfSStefano Zampini } 65071dd7afcfSStefano Zampini } 650816909a7fSStefano Zampini if (pcbddc->switch_static && pcbddc->ChangeOfBasisMatrix) { /* need to save the local change */ 650916909a7fSStefano Zampini IS is_global; 651016909a7fSStefano Zampini const PetscInt *gidxs; 651116909a7fSStefano Zampini 651216909a7fSStefano Zampini ierr = ISLocalToGlobalMappingGetIndices(pc->pmat->rmap->mapping,&gidxs);CHKERRQ(ierr); 651316909a7fSStefano Zampini ierr = ISCreateGeneral(PetscObjectComm((PetscObject)pc),pcis->n,gidxs,PETSC_COPY_VALUES,&is_global);CHKERRQ(ierr); 651416909a7fSStefano Zampini ierr = ISLocalToGlobalMappingRestoreIndices(pc->pmat->rmap->mapping,&gidxs);CHKERRQ(ierr); 65157dae84e0SHong Zhang ierr = 
MatCreateSubMatrixUnsorted(pcbddc->ChangeOfBasisMatrix,is_global,is_global,&pcbddc->switch_static_change);CHKERRQ(ierr); 651616909a7fSStefano Zampini ierr = ISDestroy(&is_global);CHKERRQ(ierr); 651716909a7fSStefano Zampini } 65181dd7afcfSStefano Zampini } 65191dd7afcfSStefano Zampini if (!pcbddc->fake_change && pcbddc->ChangeOfBasisMatrix && !pcbddc->work_change) { 65201dd7afcfSStefano Zampini ierr = VecDuplicate(pcis->vec1_global,&pcbddc->work_change);CHKERRQ(ierr); 6521b9b85e73SStefano Zampini } 6522a717540cSStefano Zampini 652372b8c272SStefano Zampini if (!pcbddc->fake_change) { 65244f1b2e48SStefano Zampini /* add pressure dofs to set of primal nodes for numbering purposes */ 65254f1b2e48SStefano Zampini for (i=0;i<pcbddc->benign_n;i++) { 65264f1b2e48SStefano Zampini pcbddc->local_primal_ref_node[pcbddc->local_primal_size_cc] = pcbddc->benign_p0_lidx[i]; 65274f1b2e48SStefano Zampini pcbddc->primal_indices_local_idxs[pcbddc->local_primal_size] = pcbddc->benign_p0_lidx[i]; 6528019a44ceSStefano Zampini pcbddc->local_primal_ref_mult[pcbddc->local_primal_size_cc] = 1; 6529019a44ceSStefano Zampini pcbddc->local_primal_size_cc++; 6530019a44ceSStefano Zampini pcbddc->local_primal_size++; 6531019a44ceSStefano Zampini } 6532019a44ceSStefano Zampini 6533019a44ceSStefano Zampini /* check if a new primal space has been introduced (also take into account benign trick) */ 6534727cdba6SStefano Zampini pcbddc->new_primal_space_local = PETSC_TRUE; 6535727cdba6SStefano Zampini if (olocal_primal_size == pcbddc->local_primal_size) { 65369f47a83aSStefano Zampini ierr = PetscMemcmp(pcbddc->local_primal_ref_node,olocal_primal_ref_node,olocal_primal_size_cc*sizeof(PetscInt),&pcbddc->new_primal_space_local);CHKERRQ(ierr); 6537c1c8e736SStefano Zampini pcbddc->new_primal_space_local = (PetscBool)(!pcbddc->new_primal_space_local); 65380e6343abSStefano Zampini if (!pcbddc->new_primal_space_local) { 65399f47a83aSStefano Zampini ierr = 
PetscMemcmp(pcbddc->local_primal_ref_mult,olocal_primal_ref_mult,olocal_primal_size_cc*sizeof(PetscInt),&pcbddc->new_primal_space_local);CHKERRQ(ierr); 6540727cdba6SStefano Zampini pcbddc->new_primal_space_local = (PetscBool)(!pcbddc->new_primal_space_local); 6541727cdba6SStefano Zampini } 65420e6343abSStefano Zampini } 6543727cdba6SStefano Zampini /* new_primal_space will be used for numbering of coarse dofs, so it should be the same across all subdomains */ 6544b2566f29SBarry Smith ierr = MPIU_Allreduce(&pcbddc->new_primal_space_local,&pcbddc->new_primal_space,1,MPIU_BOOL,MPI_LOR,PetscObjectComm((PetscObject)pc));CHKERRQ(ierr); 654572b8c272SStefano Zampini } 654672b8c272SStefano Zampini ierr = PetscFree2(olocal_primal_ref_node,olocal_primal_ref_mult);CHKERRQ(ierr); 6547727cdba6SStefano Zampini 6548a717540cSStefano Zampini /* flush dbg viewer */ 6549b8ffe317SStefano Zampini if (pcbddc->dbg_flag) { 6550b8ffe317SStefano Zampini ierr = PetscViewerFlush(pcbddc->dbg_viewer);CHKERRQ(ierr); 6551b8ffe317SStefano Zampini } 6552a717540cSStefano Zampini 6553e310c8b4SStefano Zampini /* free workspace */ 6554a717540cSStefano Zampini ierr = PetscBTDestroy(&qr_needed_idx);CHKERRQ(ierr); 65554641a718SStefano Zampini ierr = PetscBTDestroy(&change_basis);CHKERRQ(ierr); 655608122e43SStefano Zampini if (!pcbddc->adaptive_selection) { 65579162d606SStefano Zampini ierr = PetscFree3(constraints_idxs_ptr,constraints_data_ptr,constraints_n);CHKERRQ(ierr); 65589162d606SStefano Zampini ierr = PetscFree3(constraints_data,constraints_idxs,constraints_idxs_B);CHKERRQ(ierr); 655908122e43SStefano Zampini } else { 65609162d606SStefano Zampini ierr = PetscFree5(pcbddc->adaptive_constraints_n, 65619162d606SStefano Zampini pcbddc->adaptive_constraints_idxs_ptr, 65629162d606SStefano Zampini pcbddc->adaptive_constraints_data_ptr, 656308122e43SStefano Zampini pcbddc->adaptive_constraints_idxs, 656408122e43SStefano Zampini pcbddc->adaptive_constraints_data);CHKERRQ(ierr); 65659162d606SStefano Zampini 
ierr = PetscFree(constraints_n);CHKERRQ(ierr); 65669162d606SStefano Zampini ierr = PetscFree(constraints_idxs_B);CHKERRQ(ierr); 656708122e43SStefano Zampini } 6568674ae819SStefano Zampini PetscFunctionReturn(0); 6569674ae819SStefano Zampini } 6570674ae819SStefano Zampini 6571674ae819SStefano Zampini PetscErrorCode PCBDDCAnalyzeInterface(PC pc) 6572674ae819SStefano Zampini { 657371582508SStefano Zampini ISLocalToGlobalMapping map; 6574674ae819SStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 6575674ae819SStefano Zampini Mat_IS *matis = (Mat_IS*)pc->pmat->data; 657666da6bd7Sstefano_zampini PetscInt i,N; 657766da6bd7Sstefano_zampini PetscBool rcsr = PETSC_FALSE; 657866da6bd7Sstefano_zampini PetscErrorCode ierr; 6579674ae819SStefano Zampini 6580674ae819SStefano Zampini PetscFunctionBegin; 65818af8fcf9SStefano Zampini if (pcbddc->recompute_topography) { 6582b03ebc13SStefano Zampini pcbddc->graphanalyzed = PETSC_FALSE; 65838e61c736SStefano Zampini /* Reset previously computed graph */ 65848e61c736SStefano Zampini ierr = PCBDDCGraphReset(pcbddc->mat_graph);CHKERRQ(ierr); 6585674ae819SStefano Zampini /* Init local Graph struct */ 65867fb0e2dbSStefano Zampini ierr = MatGetSize(pc->pmat,&N,NULL);CHKERRQ(ierr); 658771582508SStefano Zampini ierr = MatGetLocalToGlobalMapping(pc->pmat,&map,NULL);CHKERRQ(ierr); 6588be12c134Sstefano_zampini ierr = PCBDDCGraphInit(pcbddc->mat_graph,map,N,pcbddc->graphmaxcount);CHKERRQ(ierr); 6589674ae819SStefano Zampini 65907a0e7b2cSstefano_zampini if (pcbddc->user_primal_vertices_local && !pcbddc->user_primal_vertices) { 65917a0e7b2cSstefano_zampini ierr = PCBDDCConsistencyCheckIS(pc,MPI_LOR,&pcbddc->user_primal_vertices_local);CHKERRQ(ierr); 65927a0e7b2cSstefano_zampini } 6593575ad6abSStefano Zampini /* Check validity of the csr graph passed in by the user */ 65949a962809SStefano Zampini if (pcbddc->mat_graph->nvtxs_csr && pcbddc->mat_graph->nvtxs_csr != pcbddc->mat_graph->nvtxs) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONG,"Invalid size of 
local CSR graph! Found %d, expected %d\n",pcbddc->mat_graph->nvtxs_csr,pcbddc->mat_graph->nvtxs); 65959577ea80SStefano Zampini 6596674ae819SStefano Zampini /* Set default CSR adjacency of local dofs if not provided by the user with PCBDDCSetLocalAdjacencyGraph */ 659766da6bd7Sstefano_zampini if (!pcbddc->mat_graph->xadj && pcbddc->use_local_adj) { 65984d379d7bSStefano Zampini PetscInt *xadj,*adjncy; 65994d379d7bSStefano Zampini PetscInt nvtxs; 6600e496cd5dSStefano Zampini PetscBool flg_row=PETSC_FALSE; 6601674ae819SStefano Zampini 66022fffb893SStefano Zampini ierr = MatGetRowIJ(matis->A,0,PETSC_TRUE,PETSC_FALSE,&nvtxs,(const PetscInt**)&xadj,(const PetscInt**)&adjncy,&flg_row);CHKERRQ(ierr); 66032fffb893SStefano Zampini if (flg_row) { 66044d379d7bSStefano Zampini ierr = PCBDDCSetLocalAdjacencyGraph(pc,nvtxs,xadj,adjncy,PETSC_COPY_VALUES);CHKERRQ(ierr); 6605b96c3477SStefano Zampini pcbddc->computed_rowadj = PETSC_TRUE; 66062fffb893SStefano Zampini } 66072fffb893SStefano Zampini ierr = MatRestoreRowIJ(matis->A,0,PETSC_TRUE,PETSC_FALSE,&nvtxs,(const PetscInt**)&xadj,(const PetscInt**)&adjncy,&flg_row);CHKERRQ(ierr); 660866da6bd7Sstefano_zampini rcsr = PETSC_TRUE; 6609674ae819SStefano Zampini } 66109b28b941SStefano Zampini if (pcbddc->dbg_flag) { 66119b28b941SStefano Zampini ierr = PetscViewerFlush(pcbddc->dbg_viewer);CHKERRQ(ierr); 6612674ae819SStefano Zampini } 6613674ae819SStefano Zampini 6614674ae819SStefano Zampini /* Setup of Graph */ 66154b2aedd3SStefano Zampini pcbddc->mat_graph->commsizelimit = 0; /* don't use the COMM_SELF variant of the graph */ 661614f95afaSStefano Zampini ierr = PCBDDCGraphSetUp(pcbddc->mat_graph,pcbddc->vertex_size,pcbddc->NeumannBoundariesLocal,pcbddc->DirichletBoundariesLocal,pcbddc->n_ISForDofsLocal,pcbddc->ISForDofsLocal,pcbddc->user_primal_vertices_local);CHKERRQ(ierr); 6617674ae819SStefano Zampini 66184f1b2e48SStefano Zampini /* attach info on disconnected subdomains if present */ 66194f1b2e48SStefano Zampini if 
(pcbddc->n_local_subs) { 66204f1b2e48SStefano Zampini PetscInt *local_subs; 66214f1b2e48SStefano Zampini 66224f1b2e48SStefano Zampini ierr = PetscMalloc1(N,&local_subs);CHKERRQ(ierr); 66234f1b2e48SStefano Zampini for (i=0;i<pcbddc->n_local_subs;i++) { 66244f1b2e48SStefano Zampini const PetscInt *idxs; 66254f1b2e48SStefano Zampini PetscInt nl,j; 66264f1b2e48SStefano Zampini 66274f1b2e48SStefano Zampini ierr = ISGetLocalSize(pcbddc->local_subs[i],&nl);CHKERRQ(ierr); 66284f1b2e48SStefano Zampini ierr = ISGetIndices(pcbddc->local_subs[i],&idxs);CHKERRQ(ierr); 662971582508SStefano Zampini for (j=0;j<nl;j++) local_subs[idxs[j]] = i; 66304f1b2e48SStefano Zampini ierr = ISRestoreIndices(pcbddc->local_subs[i],&idxs);CHKERRQ(ierr); 66314f1b2e48SStefano Zampini } 66324f1b2e48SStefano Zampini pcbddc->mat_graph->n_local_subs = pcbddc->n_local_subs; 66334f1b2e48SStefano Zampini pcbddc->mat_graph->local_subs = local_subs; 66344f1b2e48SStefano Zampini } 66358af8fcf9SStefano Zampini } 66364f1b2e48SStefano Zampini 6637cac5312eSStefano Zampini if (!pcbddc->graphanalyzed) { 6638674ae819SStefano Zampini /* Graph's connected components analysis */ 6639674ae819SStefano Zampini ierr = PCBDDCGraphComputeConnectedComponents(pcbddc->mat_graph);CHKERRQ(ierr); 664071582508SStefano Zampini pcbddc->graphanalyzed = PETSC_TRUE; 66418af8fcf9SStefano Zampini } 664266da6bd7Sstefano_zampini if (rcsr) pcbddc->mat_graph->nvtxs_csr = 0; 6643674ae819SStefano Zampini PetscFunctionReturn(0); 6644674ae819SStefano Zampini } 6645674ae819SStefano Zampini 66469a7d3425SStefano Zampini PetscErrorCode PCBDDCOrthonormalizeVecs(PetscInt n, Vec vecs[]) 66479a7d3425SStefano Zampini { 66489a7d3425SStefano Zampini PetscInt i,j; 66499a7d3425SStefano Zampini PetscScalar *alphas; 66509a7d3425SStefano Zampini PetscErrorCode ierr; 66519a7d3425SStefano Zampini 66529a7d3425SStefano Zampini PetscFunctionBegin; 6653785e854fSJed Brown ierr = PetscMalloc1(n,&alphas);CHKERRQ(ierr); 66549a7d3425SStefano Zampini for (i=0;i<n;i++) { 
66559a7d3425SStefano Zampini ierr = VecNormalize(vecs[i],NULL);CHKERRQ(ierr); 6656669cc0f4SStefano Zampini ierr = VecMDot(vecs[i],n-i-1,&vecs[i+1],alphas);CHKERRQ(ierr); 6657669cc0f4SStefano Zampini for (j=0;j<n-i-1;j++) alphas[j] = PetscConj(-alphas[j]); 6658669cc0f4SStefano Zampini ierr = VecMAXPY(vecs[j],n-i-1,alphas,vecs+i);CHKERRQ(ierr); 66599a7d3425SStefano Zampini } 66609a7d3425SStefano Zampini ierr = PetscFree(alphas);CHKERRQ(ierr); 66619a7d3425SStefano Zampini PetscFunctionReturn(0); 66629a7d3425SStefano Zampini } 66639a7d3425SStefano Zampini 6664bb360cb4SStefano Zampini PetscErrorCode PCBDDCMatISGetSubassemblingPattern(Mat mat, PetscInt *n_subdomains, PetscInt redprocs, IS* is_sends, PetscBool *have_void) 6665e7931f94SStefano Zampini { 666657de7509SStefano Zampini Mat A; 6667e7931f94SStefano Zampini PetscInt n_neighs,*neighs,*n_shared,**shared; 6668e7931f94SStefano Zampini PetscMPIInt size,rank,color; 666952e5ac9dSStefano Zampini PetscInt *xadj,*adjncy; 667052e5ac9dSStefano Zampini PetscInt *adjncy_wgt,*v_wgt,*ranks_send_to_idx; 6671bb360cb4SStefano Zampini PetscInt im_active,active_procs,N,n,i,j,threshold = 2; 667257de7509SStefano Zampini PetscInt void_procs,*procs_candidates = NULL; 667327b6a85dSStefano Zampini PetscInt xadj_count,*count; 667427b6a85dSStefano Zampini PetscBool ismatis,use_vwgt=PETSC_FALSE; 667527b6a85dSStefano Zampini PetscSubcomm psubcomm; 667627b6a85dSStefano Zampini MPI_Comm subcomm; 667752e5ac9dSStefano Zampini PetscErrorCode ierr; 6678a57a6d2fSStefano Zampini 6679e7931f94SStefano Zampini PetscFunctionBegin; 668057de7509SStefano Zampini PetscValidHeaderSpecific(mat,MAT_CLASSID,1); 668157de7509SStefano Zampini ierr = PetscObjectTypeCompare((PetscObject)mat,MATIS,&ismatis);CHKERRQ(ierr); 6682fbfcfee5SBarry Smith if (!ismatis) SETERRQ1(PetscObjectComm((PetscObject)mat),PETSC_ERR_SUP,"Cannot use %s on a matrix object which is not of type MATIS",PETSC_FUNCTION_NAME); 668357de7509SStefano Zampini 
PetscValidLogicalCollectiveInt(mat,*n_subdomains,2); 668457de7509SStefano Zampini PetscValidLogicalCollectiveInt(mat,redprocs,3); 668557de7509SStefano Zampini if (*n_subdomains <=0) SETERRQ1(PetscObjectComm((PetscObject)mat),PETSC_ERR_ARG_WRONG,"Invalid number of subdomains requested %d\n",*n_subdomains); 668657de7509SStefano Zampini 668757de7509SStefano Zampini if (have_void) *have_void = PETSC_FALSE; 668857de7509SStefano Zampini ierr = MPI_Comm_size(PetscObjectComm((PetscObject)mat),&size);CHKERRQ(ierr); 668957de7509SStefano Zampini ierr = MPI_Comm_rank(PetscObjectComm((PetscObject)mat),&rank);CHKERRQ(ierr); 669057de7509SStefano Zampini ierr = MatISGetLocalMat(mat,&A);CHKERRQ(ierr); 669157de7509SStefano Zampini ierr = MatGetLocalSize(A,&n,NULL);CHKERRQ(ierr); 6692bb360cb4SStefano Zampini im_active = !!n; 669357de7509SStefano Zampini ierr = MPIU_Allreduce(&im_active,&active_procs,1,MPIU_INT,MPI_SUM,PetscObjectComm((PetscObject)mat));CHKERRQ(ierr); 669457de7509SStefano Zampini void_procs = size - active_procs; 669557de7509SStefano Zampini /* get ranks of of non-active processes in mat communicator */ 669657de7509SStefano Zampini if (void_procs) { 669757de7509SStefano Zampini PetscInt ncand; 669857de7509SStefano Zampini 669957de7509SStefano Zampini if (have_void) *have_void = PETSC_TRUE; 670057de7509SStefano Zampini ierr = PetscMalloc1(size,&procs_candidates);CHKERRQ(ierr); 670157de7509SStefano Zampini ierr = MPI_Allgather(&im_active,1,MPIU_INT,procs_candidates,1,MPIU_INT,PetscObjectComm((PetscObject)mat));CHKERRQ(ierr); 670257de7509SStefano Zampini for (i=0,ncand=0;i<size;i++) { 670357de7509SStefano Zampini if (!procs_candidates[i]) { 670457de7509SStefano Zampini procs_candidates[ncand++] = i; 670557de7509SStefano Zampini } 670657de7509SStefano Zampini } 670757de7509SStefano Zampini /* force n_subdomains to be not greater that the number of non-active processes */ 670857de7509SStefano Zampini *n_subdomains = PetscMin(void_procs,*n_subdomains); 670957de7509SStefano 
Zampini } 671057de7509SStefano Zampini 6711bb360cb4SStefano Zampini /* number of subdomains requested greater than active processes or matrix size -> just shift the matrix 671214f0bfb9SStefano Zampini number of subdomains requested 1 -> send to master or first candidate in voids */ 6713bb360cb4SStefano Zampini ierr = MatGetSize(mat,&N,NULL);CHKERRQ(ierr); 6714bb360cb4SStefano Zampini if (active_procs < *n_subdomains || *n_subdomains == 1 || N <= *n_subdomains) { 671514f0bfb9SStefano Zampini PetscInt issize,isidx,dest; 671614f0bfb9SStefano Zampini if (*n_subdomains == 1) dest = 0; 671714f0bfb9SStefano Zampini else dest = rank; 671857de7509SStefano Zampini if (im_active) { 671957de7509SStefano Zampini issize = 1; 672057de7509SStefano Zampini if (procs_candidates) { /* shift the pattern on non-active candidates (if any) */ 672114f0bfb9SStefano Zampini isidx = procs_candidates[dest]; 672257de7509SStefano Zampini } else { 672314f0bfb9SStefano Zampini isidx = dest; 672457de7509SStefano Zampini } 672557de7509SStefano Zampini } else { 672657de7509SStefano Zampini issize = 0; 672757de7509SStefano Zampini isidx = -1; 672857de7509SStefano Zampini } 6729bb360cb4SStefano Zampini if (*n_subdomains != 1) *n_subdomains = active_procs; 673057de7509SStefano Zampini ierr = ISCreateGeneral(PetscObjectComm((PetscObject)mat),issize,&isidx,PETSC_COPY_VALUES,is_sends);CHKERRQ(ierr); 6731daf8a457SStefano Zampini ierr = PetscFree(procs_candidates);CHKERRQ(ierr); 673257de7509SStefano Zampini PetscFunctionReturn(0); 673357de7509SStefano Zampini } 6734c5929fdfSBarry Smith ierr = PetscOptionsGetBool(NULL,NULL,"-matis_partitioning_use_vwgt",&use_vwgt,NULL);CHKERRQ(ierr); 6735c5929fdfSBarry Smith ierr = PetscOptionsGetInt(NULL,NULL,"-matis_partitioning_threshold",&threshold,NULL);CHKERRQ(ierr); 673627b6a85dSStefano Zampini threshold = PetscMax(threshold,2); 6737e7931f94SStefano Zampini 6738e7931f94SStefano Zampini /* Get info on mapping */ 67393bbff08aSStefano Zampini ierr = 
ISLocalToGlobalMappingGetInfo(mat->rmap->mapping,&n_neighs,&neighs,&n_shared,&shared);CHKERRQ(ierr); 6740e7931f94SStefano Zampini 6741e7931f94SStefano Zampini /* build local CSR graph of subdomains' connectivity */ 6742785e854fSJed Brown ierr = PetscMalloc1(2,&xadj);CHKERRQ(ierr); 6743e7931f94SStefano Zampini xadj[0] = 0; 6744e7931f94SStefano Zampini xadj[1] = PetscMax(n_neighs-1,0); 6745785e854fSJed Brown ierr = PetscMalloc1(xadj[1],&adjncy);CHKERRQ(ierr); 6746785e854fSJed Brown ierr = PetscMalloc1(xadj[1],&adjncy_wgt);CHKERRQ(ierr); 6747bb360cb4SStefano Zampini ierr = PetscCalloc1(n,&count);CHKERRQ(ierr); 674827b6a85dSStefano Zampini for (i=1;i<n_neighs;i++) 674927b6a85dSStefano Zampini for (j=0;j<n_shared[i];j++) 675027b6a85dSStefano Zampini count[shared[i][j]] += 1; 6751e7931f94SStefano Zampini 675227b6a85dSStefano Zampini xadj_count = 0; 67532b510759SStefano Zampini for (i=1;i<n_neighs;i++) { 675427b6a85dSStefano Zampini for (j=0;j<n_shared[i];j++) { 675527b6a85dSStefano Zampini if (count[shared[i][j]] < threshold) { 6756d023bfaeSStefano Zampini adjncy[xadj_count] = neighs[i]; 6757d023bfaeSStefano Zampini adjncy_wgt[xadj_count] = n_shared[i]; 6758d023bfaeSStefano Zampini xadj_count++; 675927b6a85dSStefano Zampini break; 676027b6a85dSStefano Zampini } 6761e7931f94SStefano Zampini } 6762e7931f94SStefano Zampini } 6763d023bfaeSStefano Zampini xadj[1] = xadj_count; 676427b6a85dSStefano Zampini ierr = PetscFree(count);CHKERRQ(ierr); 67653bbff08aSStefano Zampini ierr = ISLocalToGlobalMappingRestoreInfo(mat->rmap->mapping,&n_neighs,&neighs,&n_shared,&shared);CHKERRQ(ierr); 6766e7931f94SStefano Zampini ierr = PetscSortIntWithArray(xadj[1],adjncy,adjncy_wgt);CHKERRQ(ierr); 6767e7931f94SStefano Zampini 67683837a79fSStefano Zampini ierr = PetscMalloc1(1,&ranks_send_to_idx);CHKERRQ(ierr); 6769e7931f94SStefano Zampini 677027b6a85dSStefano Zampini /* Restrict work on active processes only */ 677127b6a85dSStefano Zampini ierr = 
PetscMPIIntCast(im_active,&color);CHKERRQ(ierr); 677227b6a85dSStefano Zampini if (void_procs) { 677327b6a85dSStefano Zampini ierr = PetscSubcommCreate(PetscObjectComm((PetscObject)mat),&psubcomm);CHKERRQ(ierr); 677427b6a85dSStefano Zampini ierr = PetscSubcommSetNumber(psubcomm,2);CHKERRQ(ierr); /* 2 groups, active process and not active processes */ 677527b6a85dSStefano Zampini ierr = PetscSubcommSetTypeGeneral(psubcomm,color,rank);CHKERRQ(ierr); 677627b6a85dSStefano Zampini subcomm = PetscSubcommChild(psubcomm); 677727b6a85dSStefano Zampini } else { 677827b6a85dSStefano Zampini psubcomm = NULL; 677927b6a85dSStefano Zampini subcomm = PetscObjectComm((PetscObject)mat); 678027b6a85dSStefano Zampini } 678127b6a85dSStefano Zampini 678227b6a85dSStefano Zampini v_wgt = NULL; 678327b6a85dSStefano Zampini if (!color) { 6784e7931f94SStefano Zampini ierr = PetscFree(xadj);CHKERRQ(ierr); 6785e7931f94SStefano Zampini ierr = PetscFree(adjncy);CHKERRQ(ierr); 6786e7931f94SStefano Zampini ierr = PetscFree(adjncy_wgt);CHKERRQ(ierr); 6787c8587f34SStefano Zampini } else { 678852e5ac9dSStefano Zampini Mat subdomain_adj; 678952e5ac9dSStefano Zampini IS new_ranks,new_ranks_contig; 679052e5ac9dSStefano Zampini MatPartitioning partitioner; 679127b6a85dSStefano Zampini PetscInt rstart=0,rend=0; 679252e5ac9dSStefano Zampini PetscInt *is_indices,*oldranks; 679357de7509SStefano Zampini PetscMPIInt size; 6794b0c7d250SStefano Zampini PetscBool aggregate; 6795b0c7d250SStefano Zampini 679627b6a85dSStefano Zampini ierr = MPI_Comm_size(subcomm,&size);CHKERRQ(ierr); 679727b6a85dSStefano Zampini if (void_procs) { 679827b6a85dSStefano Zampini PetscInt prank = rank; 6799785e854fSJed Brown ierr = PetscMalloc1(size,&oldranks);CHKERRQ(ierr); 680027b6a85dSStefano Zampini ierr = MPI_Allgather(&prank,1,MPIU_INT,oldranks,1,MPIU_INT,subcomm);CHKERRQ(ierr); 6801e7931f94SStefano Zampini for (i=0;i<xadj[1];i++) { 6802e7931f94SStefano Zampini ierr = PetscFindInt(adjncy[i],size,oldranks,&adjncy[i]);CHKERRQ(ierr); 
6803c8587f34SStefano Zampini } 6804e7931f94SStefano Zampini ierr = PetscSortIntWithArray(xadj[1],adjncy,adjncy_wgt);CHKERRQ(ierr); 680527b6a85dSStefano Zampini } else { 680627b6a85dSStefano Zampini oldranks = NULL; 680727b6a85dSStefano Zampini } 6808b0c7d250SStefano Zampini aggregate = ((redprocs > 0 && redprocs < size) ? PETSC_TRUE : PETSC_FALSE); 680927b6a85dSStefano Zampini if (aggregate) { /* TODO: all this part could be made more efficient */ 6810b0c7d250SStefano Zampini PetscInt lrows,row,ncols,*cols; 6811b0c7d250SStefano Zampini PetscMPIInt nrank; 6812b0c7d250SStefano Zampini PetscScalar *vals; 6813b0c7d250SStefano Zampini 681427b6a85dSStefano Zampini ierr = MPI_Comm_rank(subcomm,&nrank);CHKERRQ(ierr); 6815b0c7d250SStefano Zampini lrows = 0; 6816b0c7d250SStefano Zampini if (nrank<redprocs) { 6817b0c7d250SStefano Zampini lrows = size/redprocs; 6818b0c7d250SStefano Zampini if (nrank<size%redprocs) lrows++; 6819b0c7d250SStefano Zampini } 682027b6a85dSStefano Zampini ierr = MatCreateAIJ(subcomm,lrows,lrows,size,size,50,NULL,50,NULL,&subdomain_adj);CHKERRQ(ierr); 6821b0c7d250SStefano Zampini ierr = MatGetOwnershipRange(subdomain_adj,&rstart,&rend);CHKERRQ(ierr); 6822b0c7d250SStefano Zampini ierr = MatSetOption(subdomain_adj,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_FALSE);CHKERRQ(ierr); 6823b0c7d250SStefano Zampini ierr = MatSetOption(subdomain_adj,MAT_NEW_NONZERO_ALLOCATION_ERR,PETSC_FALSE);CHKERRQ(ierr); 6824b0c7d250SStefano Zampini row = nrank; 6825b0c7d250SStefano Zampini ncols = xadj[1]-xadj[0]; 6826b0c7d250SStefano Zampini cols = adjncy; 6827b0c7d250SStefano Zampini ierr = PetscMalloc1(ncols,&vals);CHKERRQ(ierr); 6828b0c7d250SStefano Zampini for (i=0;i<ncols;i++) vals[i] = adjncy_wgt[i]; 6829b0c7d250SStefano Zampini ierr = MatSetValues(subdomain_adj,1,&row,ncols,cols,vals,INSERT_VALUES);CHKERRQ(ierr); 6830b0c7d250SStefano Zampini ierr = MatAssemblyBegin(subdomain_adj,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 6831b0c7d250SStefano Zampini ierr = 
MatAssemblyEnd(subdomain_adj,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 683252e5ac9dSStefano Zampini ierr = PetscFree(xadj);CHKERRQ(ierr); 683352e5ac9dSStefano Zampini ierr = PetscFree(adjncy);CHKERRQ(ierr); 683452e5ac9dSStefano Zampini ierr = PetscFree(adjncy_wgt);CHKERRQ(ierr); 6835b0c7d250SStefano Zampini ierr = PetscFree(vals);CHKERRQ(ierr); 683627b6a85dSStefano Zampini if (use_vwgt) { 683727b6a85dSStefano Zampini Vec v; 683827b6a85dSStefano Zampini const PetscScalar *array; 683927b6a85dSStefano Zampini PetscInt nl; 684027b6a85dSStefano Zampini 684127b6a85dSStefano Zampini ierr = MatCreateVecs(subdomain_adj,&v,NULL);CHKERRQ(ierr); 6842bb360cb4SStefano Zampini ierr = VecSetValue(v,row,(PetscScalar)n,INSERT_VALUES);CHKERRQ(ierr); 684327b6a85dSStefano Zampini ierr = VecAssemblyBegin(v);CHKERRQ(ierr); 684427b6a85dSStefano Zampini ierr = VecAssemblyEnd(v);CHKERRQ(ierr); 684527b6a85dSStefano Zampini ierr = VecGetLocalSize(v,&nl);CHKERRQ(ierr); 684627b6a85dSStefano Zampini ierr = VecGetArrayRead(v,&array);CHKERRQ(ierr); 684727b6a85dSStefano Zampini ierr = PetscMalloc1(nl,&v_wgt);CHKERRQ(ierr); 684822db5ddcSStefano Zampini for (i=0;i<nl;i++) v_wgt[i] = (PetscInt)PetscRealPart(array[i]); 684927b6a85dSStefano Zampini ierr = VecRestoreArrayRead(v,&array);CHKERRQ(ierr); 685027b6a85dSStefano Zampini ierr = VecDestroy(&v);CHKERRQ(ierr); 685127b6a85dSStefano Zampini } 6852b0c7d250SStefano Zampini } else { 685327b6a85dSStefano Zampini ierr = MatCreateMPIAdj(subcomm,1,(PetscInt)size,xadj,adjncy,adjncy_wgt,&subdomain_adj);CHKERRQ(ierr); 685427b6a85dSStefano Zampini if (use_vwgt) { 685527b6a85dSStefano Zampini ierr = PetscMalloc1(1,&v_wgt);CHKERRQ(ierr); 6856bb360cb4SStefano Zampini v_wgt[0] = n; 685727b6a85dSStefano Zampini } 6858b0c7d250SStefano Zampini } 685922b6e8a2SStefano Zampini /* ierr = MatView(subdomain_adj,0);CHKERRQ(ierr); */ 6860e7931f94SStefano Zampini 6861e7931f94SStefano Zampini /* Partition */ 686227b6a85dSStefano Zampini ierr = 
MatPartitioningCreate(subcomm,&partitioner);CHKERRQ(ierr); 6863e7931f94SStefano Zampini ierr = MatPartitioningSetAdjacency(partitioner,subdomain_adj);CHKERRQ(ierr); 686427b6a85dSStefano Zampini if (v_wgt) { 6865e7931f94SStefano Zampini ierr = MatPartitioningSetVertexWeights(partitioner,v_wgt);CHKERRQ(ierr); 6866c8587f34SStefano Zampini } 686757de7509SStefano Zampini *n_subdomains = PetscMin((PetscInt)size,*n_subdomains); 686857de7509SStefano Zampini ierr = MatPartitioningSetNParts(partitioner,*n_subdomains);CHKERRQ(ierr); 6869e7931f94SStefano Zampini ierr = MatPartitioningSetFromOptions(partitioner);CHKERRQ(ierr); 6870e7931f94SStefano Zampini ierr = MatPartitioningApply(partitioner,&new_ranks);CHKERRQ(ierr); 687122b6e8a2SStefano Zampini /* ierr = MatPartitioningView(partitioner,0);CHKERRQ(ierr); */ 6872e7931f94SStefano Zampini 687352e5ac9dSStefano Zampini /* renumber new_ranks to avoid "holes" in new set of processors */ 68746583bcc1SStefano Zampini ierr = ISRenumber(new_ranks,NULL,NULL,&new_ranks_contig);CHKERRQ(ierr); 687552e5ac9dSStefano Zampini ierr = ISDestroy(&new_ranks);CHKERRQ(ierr); 687652e5ac9dSStefano Zampini ierr = ISGetIndices(new_ranks_contig,(const PetscInt**)&is_indices);CHKERRQ(ierr); 687757de7509SStefano Zampini if (!aggregate) { 687857de7509SStefano Zampini if (procs_candidates) { /* shift the pattern on non-active candidates (if any) */ 687927b6a85dSStefano Zampini #if defined(PETSC_USE_DEBUG) 688027b6a85dSStefano Zampini if (!oldranks) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"This should not happen"); 688127b6a85dSStefano Zampini #endif 688257de7509SStefano Zampini ranks_send_to_idx[0] = procs_candidates[oldranks[is_indices[0]]]; 688327b6a85dSStefano Zampini } else if (oldranks) { 6884b0c7d250SStefano Zampini ranks_send_to_idx[0] = oldranks[is_indices[0]]; 688527b6a85dSStefano Zampini } else { 688627b6a85dSStefano Zampini ranks_send_to_idx[0] = is_indices[0]; 688757de7509SStefano Zampini } 688828143c3dSStefano Zampini } else { 6889*7fb8a5e4SKarl 
Rupp PetscInt idx = 0; 6890b0c7d250SStefano Zampini PetscMPIInt tag; 6891b0c7d250SStefano Zampini MPI_Request *reqs; 6892b0c7d250SStefano Zampini 6893b0c7d250SStefano Zampini ierr = PetscObjectGetNewTag((PetscObject)subdomain_adj,&tag);CHKERRQ(ierr); 6894b0c7d250SStefano Zampini ierr = PetscMalloc1(rend-rstart,&reqs);CHKERRQ(ierr); 6895b0c7d250SStefano Zampini for (i=rstart;i<rend;i++) { 689627b6a85dSStefano Zampini ierr = MPI_Isend(is_indices+i-rstart,1,MPIU_INT,i,tag,subcomm,&reqs[i-rstart]);CHKERRQ(ierr); 689728143c3dSStefano Zampini } 6898*7fb8a5e4SKarl Rupp ierr = MPI_Recv(&idx,1,MPIU_INT,MPI_ANY_SOURCE,tag,subcomm,MPI_STATUS_IGNORE);CHKERRQ(ierr); 6899b0c7d250SStefano Zampini ierr = MPI_Waitall(rend-rstart,reqs,MPI_STATUSES_IGNORE);CHKERRQ(ierr); 6900b0c7d250SStefano Zampini ierr = PetscFree(reqs);CHKERRQ(ierr); 690157de7509SStefano Zampini if (procs_candidates) { /* shift the pattern on non-active candidates (if any) */ 690227b6a85dSStefano Zampini #if defined(PETSC_USE_DEBUG) 690327b6a85dSStefano Zampini if (!oldranks) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"This should not happen"); 690427b6a85dSStefano Zampini #endif 6905*7fb8a5e4SKarl Rupp ranks_send_to_idx[0] = procs_candidates[oldranks[idx]]; 690627b6a85dSStefano Zampini } else if (oldranks) { 6907*7fb8a5e4SKarl Rupp ranks_send_to_idx[0] = oldranks[idx]; 690827b6a85dSStefano Zampini } else { 6909*7fb8a5e4SKarl Rupp ranks_send_to_idx[0] = idx; 6910e7931f94SStefano Zampini } 691157de7509SStefano Zampini } 691252e5ac9dSStefano Zampini ierr = ISRestoreIndices(new_ranks_contig,(const PetscInt**)&is_indices);CHKERRQ(ierr); 6913e7931f94SStefano Zampini /* clean up */ 6914e7931f94SStefano Zampini ierr = PetscFree(oldranks);CHKERRQ(ierr); 691552e5ac9dSStefano Zampini ierr = ISDestroy(&new_ranks_contig);CHKERRQ(ierr); 6916e7931f94SStefano Zampini ierr = MatDestroy(&subdomain_adj);CHKERRQ(ierr); 6917e7931f94SStefano Zampini ierr = MatPartitioningDestroy(&partitioner);CHKERRQ(ierr); 6918e7931f94SStefano Zampini } 
691927b6a85dSStefano Zampini ierr = PetscSubcommDestroy(&psubcomm);CHKERRQ(ierr); 692057de7509SStefano Zampini ierr = PetscFree(procs_candidates);CHKERRQ(ierr); 6921e7931f94SStefano Zampini 6922e7931f94SStefano Zampini /* assemble parallel IS for sends */ 6923e7931f94SStefano Zampini i = 1; 692427b6a85dSStefano Zampini if (!color) i=0; 692557de7509SStefano Zampini ierr = ISCreateGeneral(PetscObjectComm((PetscObject)mat),i,ranks_send_to_idx,PETSC_OWN_POINTER,is_sends);CHKERRQ(ierr); 6926e7931f94SStefano Zampini PetscFunctionReturn(0); 6927e7931f94SStefano Zampini } 6928e7931f94SStefano Zampini 6929e7931f94SStefano Zampini typedef enum {MATDENSE_PRIVATE=0,MATAIJ_PRIVATE,MATBAIJ_PRIVATE,MATSBAIJ_PRIVATE}MatTypePrivate; 6930e7931f94SStefano Zampini 69311e0482f5SStefano Zampini PetscErrorCode PCBDDCMatISSubassemble(Mat mat, IS is_sends, PetscInt n_subdomains, PetscBool restrict_comm, PetscBool restrict_full, PetscBool reuse, Mat *mat_n, PetscInt nis, IS isarray[], PetscInt nvecs, Vec nnsp_vec[]) 6932e7931f94SStefano Zampini { 693370cf5478SStefano Zampini Mat local_mat; 6934e7931f94SStefano Zampini IS is_sends_internal; 69359d30be91SStefano Zampini PetscInt rows,cols,new_local_rows; 69361ae86dd6SStefano Zampini PetscInt i,bs,buf_size_idxs,buf_size_idxs_is,buf_size_vals,buf_size_vecs; 69379d30be91SStefano Zampini PetscBool ismatis,isdense,newisdense,destroy_mat; 6938e7931f94SStefano Zampini ISLocalToGlobalMapping l2gmap; 6939e7931f94SStefano Zampini PetscInt* l2gmap_indices; 6940e7931f94SStefano Zampini const PetscInt* is_indices; 6941e7931f94SStefano Zampini MatType new_local_type; 6942e7931f94SStefano Zampini /* buffers */ 6943e7931f94SStefano Zampini PetscInt *ptr_idxs,*send_buffer_idxs,*recv_buffer_idxs; 694428143c3dSStefano Zampini PetscInt *ptr_idxs_is,*send_buffer_idxs_is,*recv_buffer_idxs_is; 69459d30be91SStefano Zampini PetscInt *recv_buffer_idxs_local; 6946e7931f94SStefano Zampini PetscScalar *ptr_vals,*send_buffer_vals,*recv_buffer_vals; 69471ae86dd6SStefano 
Zampini PetscScalar *ptr_vecs,*send_buffer_vecs,*recv_buffer_vecs; 6948e7931f94SStefano Zampini /* MPI */ 694928143c3dSStefano Zampini MPI_Comm comm,comm_n; 695028143c3dSStefano Zampini PetscSubcomm subcomm; 6951e7931f94SStefano Zampini PetscMPIInt n_sends,n_recvs,commsize; 695228143c3dSStefano Zampini PetscMPIInt *iflags,*ilengths_idxs,*ilengths_vals,*ilengths_idxs_is; 695328143c3dSStefano Zampini PetscMPIInt *onodes,*onodes_is,*olengths_idxs,*olengths_idxs_is,*olengths_vals; 69541ae86dd6SStefano Zampini PetscMPIInt len,tag_idxs,tag_idxs_is,tag_vals,tag_vecs,source_dest; 69551ae86dd6SStefano Zampini MPI_Request *send_req_idxs,*send_req_idxs_is,*send_req_vals,*send_req_vecs; 69561ae86dd6SStefano Zampini MPI_Request *recv_req_idxs,*recv_req_idxs_is,*recv_req_vals,*recv_req_vecs; 6957e7931f94SStefano Zampini PetscErrorCode ierr; 6958e7931f94SStefano Zampini 6959e7931f94SStefano Zampini PetscFunctionBegin; 696057de7509SStefano Zampini PetscValidHeaderSpecific(mat,MAT_CLASSID,1); 6961e7931f94SStefano Zampini ierr = PetscObjectTypeCompare((PetscObject)mat,MATIS,&ismatis);CHKERRQ(ierr); 6962fbfcfee5SBarry Smith if (!ismatis) SETERRQ1(PetscObjectComm((PetscObject)mat),PETSC_ERR_SUP,"Cannot use %s on a matrix object which is not of type MATIS",PETSC_FUNCTION_NAME); 696357de7509SStefano Zampini PetscValidLogicalCollectiveInt(mat,n_subdomains,3); 696457de7509SStefano Zampini PetscValidLogicalCollectiveBool(mat,restrict_comm,4); 696557de7509SStefano Zampini PetscValidLogicalCollectiveBool(mat,restrict_full,5); 696657de7509SStefano Zampini PetscValidLogicalCollectiveBool(mat,reuse,6); 696757de7509SStefano Zampini PetscValidLogicalCollectiveInt(mat,nis,8); 69681ae86dd6SStefano Zampini PetscValidLogicalCollectiveInt(mat,nvecs,10); 69691ae86dd6SStefano Zampini if (nvecs) { 69701ae86dd6SStefano Zampini if (nvecs > 1) SETERRQ(PetscObjectComm((PetscObject)mat),PETSC_ERR_SUP,"Just 1 vector supported"); 69711ae86dd6SStefano Zampini PetscValidHeaderSpecific(nnsp_vec[0],VEC_CLASSID,11); 
69721ae86dd6SStefano Zampini } 697357de7509SStefano Zampini /* further checks */ 6974e7931f94SStefano Zampini ierr = MatISGetLocalMat(mat,&local_mat);CHKERRQ(ierr); 6975e7931f94SStefano Zampini ierr = PetscObjectTypeCompare((PetscObject)local_mat,MATSEQDENSE,&isdense);CHKERRQ(ierr); 6976e7931f94SStefano Zampini if (!isdense) SETERRQ(PetscObjectComm((PetscObject)mat),PETSC_ERR_SUP,"Currently cannot subassemble MATIS when local matrix type is not of type SEQDENSE"); 6977e7931f94SStefano Zampini ierr = MatGetSize(local_mat,&rows,&cols);CHKERRQ(ierr); 6978e7931f94SStefano Zampini if (rows != cols) SETERRQ(PetscObjectComm((PetscObject)mat),PETSC_ERR_SUP,"Local MATIS matrices should be square"); 697957de7509SStefano Zampini if (reuse && *mat_n) { 698070cf5478SStefano Zampini PetscInt mrows,mcols,mnrows,mncols; 698157de7509SStefano Zampini PetscValidHeaderSpecific(*mat_n,MAT_CLASSID,7); 698270cf5478SStefano Zampini ierr = PetscObjectTypeCompare((PetscObject)*mat_n,MATIS,&ismatis);CHKERRQ(ierr); 698328143c3dSStefano Zampini if (!ismatis) SETERRQ(PetscObjectComm((PetscObject)*mat_n),PETSC_ERR_SUP,"Cannot reuse a matrix which is not of type MATIS"); 698470cf5478SStefano Zampini ierr = MatGetSize(mat,&mrows,&mcols);CHKERRQ(ierr); 698570cf5478SStefano Zampini ierr = MatGetSize(*mat_n,&mnrows,&mncols);CHKERRQ(ierr); 698670cf5478SStefano Zampini if (mrows != mnrows) SETERRQ2(PetscObjectComm((PetscObject)mat),PETSC_ERR_SUP,"Cannot reuse matrix! Wrong number of rows %D != %D",mrows,mnrows); 698770cf5478SStefano Zampini if (mcols != mncols) SETERRQ2(PetscObjectComm((PetscObject)mat),PETSC_ERR_SUP,"Cannot reuse matrix! 
Wrong number of cols %D != %D",mcols,mncols); 698870cf5478SStefano Zampini } 6989e7931f94SStefano Zampini ierr = MatGetBlockSize(local_mat,&bs);CHKERRQ(ierr); 6990e7931f94SStefano Zampini PetscValidLogicalCollectiveInt(mat,bs,0); 699157de7509SStefano Zampini 6992e7931f94SStefano Zampini /* prepare IS for sending if not provided */ 6993e7931f94SStefano Zampini if (!is_sends) { 699428143c3dSStefano Zampini if (!n_subdomains) SETERRQ(PetscObjectComm((PetscObject)mat),PETSC_ERR_SUP,"You should specify either an IS or a target number of subdomains"); 6995bb360cb4SStefano Zampini ierr = PCBDDCMatISGetSubassemblingPattern(mat,&n_subdomains,0,&is_sends_internal,NULL);CHKERRQ(ierr); 6996c8587f34SStefano Zampini } else { 6997e7931f94SStefano Zampini ierr = PetscObjectReference((PetscObject)is_sends);CHKERRQ(ierr); 6998e7931f94SStefano Zampini is_sends_internal = is_sends; 6999c8587f34SStefano Zampini } 7000e7931f94SStefano Zampini 7001e7931f94SStefano Zampini /* get comm */ 7002a316fed8SStefano Zampini ierr = PetscObjectGetComm((PetscObject)mat,&comm);CHKERRQ(ierr); 7003e7931f94SStefano Zampini 7004e7931f94SStefano Zampini /* compute number of sends */ 7005e7931f94SStefano Zampini ierr = ISGetLocalSize(is_sends_internal,&i);CHKERRQ(ierr); 7006e7931f94SStefano Zampini ierr = PetscMPIIntCast(i,&n_sends);CHKERRQ(ierr); 7007e7931f94SStefano Zampini 7008e7931f94SStefano Zampini /* compute number of receives */ 7009e7931f94SStefano Zampini ierr = MPI_Comm_size(comm,&commsize);CHKERRQ(ierr); 7010785e854fSJed Brown ierr = PetscMalloc1(commsize,&iflags);CHKERRQ(ierr); 7011e7931f94SStefano Zampini ierr = PetscMemzero(iflags,commsize*sizeof(*iflags));CHKERRQ(ierr); 7012e7931f94SStefano Zampini ierr = ISGetIndices(is_sends_internal,&is_indices);CHKERRQ(ierr); 7013e7931f94SStefano Zampini for (i=0;i<n_sends;i++) iflags[is_indices[i]] = 1; 7014e7931f94SStefano Zampini ierr = PetscGatherNumberOfMessages(comm,iflags,NULL,&n_recvs);CHKERRQ(ierr); 7015e7931f94SStefano Zampini ierr = 
PetscFree(iflags);CHKERRQ(ierr); 7016e7931f94SStefano Zampini 701728143c3dSStefano Zampini /* restrict comm if requested */ 701828143c3dSStefano Zampini subcomm = 0; 701928143c3dSStefano Zampini destroy_mat = PETSC_FALSE; 702028143c3dSStefano Zampini if (restrict_comm) { 7021779c1cceSStefano Zampini PetscMPIInt color,subcommsize; 7022779c1cceSStefano Zampini 702328143c3dSStefano Zampini color = 0; 702453a05cb3SStefano Zampini if (restrict_full) { 702553a05cb3SStefano Zampini if (!n_recvs) color = 1; /* processes not receiving anything will not partecipate in new comm (full restriction) */ 702653a05cb3SStefano Zampini } else { 702753a05cb3SStefano Zampini if (!n_recvs && n_sends) color = 1; /* just those processes that are sending but not receiving anything will not partecipate in new comm */ 702853a05cb3SStefano Zampini } 7029b2566f29SBarry Smith ierr = MPIU_Allreduce(&color,&subcommsize,1,MPI_INT,MPI_SUM,comm);CHKERRQ(ierr); 703028143c3dSStefano Zampini subcommsize = commsize - subcommsize; 703128143c3dSStefano Zampini /* check if reuse has been requested */ 703257de7509SStefano Zampini if (reuse) { 703328143c3dSStefano Zampini if (*mat_n) { 703428143c3dSStefano Zampini PetscMPIInt subcommsize2; 703528143c3dSStefano Zampini ierr = MPI_Comm_size(PetscObjectComm((PetscObject)*mat_n),&subcommsize2);CHKERRQ(ierr); 703628143c3dSStefano Zampini if (subcommsize != subcommsize2) SETERRQ2(PetscObjectComm((PetscObject)*mat_n),PETSC_ERR_PLIB,"Cannot reuse matrix! 
wrong subcomm size %d != %d",subcommsize,subcommsize2); 703728143c3dSStefano Zampini comm_n = PetscObjectComm((PetscObject)*mat_n); 703828143c3dSStefano Zampini } else { 703928143c3dSStefano Zampini comm_n = PETSC_COMM_SELF; 704028143c3dSStefano Zampini } 704128143c3dSStefano Zampini } else { /* MAT_INITIAL_MATRIX */ 7042779c1cceSStefano Zampini PetscMPIInt rank; 7043779c1cceSStefano Zampini 7044779c1cceSStefano Zampini ierr = MPI_Comm_rank(comm,&rank);CHKERRQ(ierr); 704528143c3dSStefano Zampini ierr = PetscSubcommCreate(comm,&subcomm);CHKERRQ(ierr); 704628143c3dSStefano Zampini ierr = PetscSubcommSetNumber(subcomm,2);CHKERRQ(ierr); 704728143c3dSStefano Zampini ierr = PetscSubcommSetTypeGeneral(subcomm,color,rank);CHKERRQ(ierr); 7048306c2d5bSBarry Smith comm_n = PetscSubcommChild(subcomm); 704928143c3dSStefano Zampini } 705028143c3dSStefano Zampini /* flag to destroy *mat_n if not significative */ 705128143c3dSStefano Zampini if (color) destroy_mat = PETSC_TRUE; 705228143c3dSStefano Zampini } else { 705328143c3dSStefano Zampini comm_n = comm; 705428143c3dSStefano Zampini } 705528143c3dSStefano Zampini 7056e7931f94SStefano Zampini /* prepare send/receive buffers */ 7057785e854fSJed Brown ierr = PetscMalloc1(commsize,&ilengths_idxs);CHKERRQ(ierr); 7058e7931f94SStefano Zampini ierr = PetscMemzero(ilengths_idxs,commsize*sizeof(*ilengths_idxs));CHKERRQ(ierr); 7059785e854fSJed Brown ierr = PetscMalloc1(commsize,&ilengths_vals);CHKERRQ(ierr); 7060e7931f94SStefano Zampini ierr = PetscMemzero(ilengths_vals,commsize*sizeof(*ilengths_vals));CHKERRQ(ierr); 706128143c3dSStefano Zampini if (nis) { 7062854ce69bSBarry Smith ierr = PetscCalloc1(commsize,&ilengths_idxs_is);CHKERRQ(ierr); 706328143c3dSStefano Zampini } 7064e7931f94SStefano Zampini 706528143c3dSStefano Zampini /* Get data from local matrices */ 70666c4ed002SBarry Smith if (!isdense) SETERRQ(PetscObjectComm((PetscObject)mat),PETSC_ERR_SUP,"Subassembling of AIJ local matrices not yet implemented"); 7067e7931f94SStefano 
Zampini /* TODO: See below some guidelines on how to prepare the local buffers */ 7068e7931f94SStefano Zampini /* 7069e7931f94SStefano Zampini send_buffer_vals should contain the raw values of the local matrix 7070e7931f94SStefano Zampini send_buffer_idxs should contain: 7071e7931f94SStefano Zampini - MatType_PRIVATE type 7072e7931f94SStefano Zampini - PetscInt size_of_l2gmap 7073e7931f94SStefano Zampini - PetscInt global_row_indices[size_of_l2gmap] 7074e7931f94SStefano Zampini - PetscInt all_other_info_which_is_needed_to_compute_preallocation_and_set_values 7075e7931f94SStefano Zampini */ 70766c4ed002SBarry Smith else { 7077e7931f94SStefano Zampini ierr = MatDenseGetArray(local_mat,&send_buffer_vals);CHKERRQ(ierr); 70783bbff08aSStefano Zampini ierr = ISLocalToGlobalMappingGetSize(mat->rmap->mapping,&i);CHKERRQ(ierr); 7079854ce69bSBarry Smith ierr = PetscMalloc1(i+2,&send_buffer_idxs);CHKERRQ(ierr); 7080e7931f94SStefano Zampini send_buffer_idxs[0] = (PetscInt)MATDENSE_PRIVATE; 7081e7931f94SStefano Zampini send_buffer_idxs[1] = i; 70823bbff08aSStefano Zampini ierr = ISLocalToGlobalMappingGetIndices(mat->rmap->mapping,(const PetscInt**)&ptr_idxs);CHKERRQ(ierr); 7083e7931f94SStefano Zampini ierr = PetscMemcpy(&send_buffer_idxs[2],ptr_idxs,i*sizeof(PetscInt));CHKERRQ(ierr); 70843bbff08aSStefano Zampini ierr = ISLocalToGlobalMappingRestoreIndices(mat->rmap->mapping,(const PetscInt**)&ptr_idxs);CHKERRQ(ierr); 7085e7931f94SStefano Zampini ierr = PetscMPIIntCast(i,&len);CHKERRQ(ierr); 7086e7931f94SStefano Zampini for (i=0;i<n_sends;i++) { 7087e7931f94SStefano Zampini ilengths_vals[is_indices[i]] = len*len; 7088e7931f94SStefano Zampini ilengths_idxs[is_indices[i]] = len+2; 7089c8587f34SStefano Zampini } 7090c8587f34SStefano Zampini } 7091e7931f94SStefano Zampini ierr = PetscGatherMessageLengths2(comm,n_sends,n_recvs,ilengths_idxs,ilengths_vals,&onodes,&olengths_idxs,&olengths_vals);CHKERRQ(ierr); 709228143c3dSStefano Zampini /* additional is (if any) */ 709328143c3dSStefano 
Zampini if (nis) { 709428143c3dSStefano Zampini PetscMPIInt psum; 709528143c3dSStefano Zampini PetscInt j; 709628143c3dSStefano Zampini for (j=0,psum=0;j<nis;j++) { 709728143c3dSStefano Zampini PetscInt plen; 709828143c3dSStefano Zampini ierr = ISGetLocalSize(isarray[j],&plen);CHKERRQ(ierr); 709928143c3dSStefano Zampini ierr = PetscMPIIntCast(plen,&len);CHKERRQ(ierr); 710028143c3dSStefano Zampini psum += len+1; /* indices + lenght */ 710128143c3dSStefano Zampini } 7102854ce69bSBarry Smith ierr = PetscMalloc1(psum,&send_buffer_idxs_is);CHKERRQ(ierr); 710328143c3dSStefano Zampini for (j=0,psum=0;j<nis;j++) { 710428143c3dSStefano Zampini PetscInt plen; 710528143c3dSStefano Zampini const PetscInt *is_array_idxs; 710628143c3dSStefano Zampini ierr = ISGetLocalSize(isarray[j],&plen);CHKERRQ(ierr); 710728143c3dSStefano Zampini send_buffer_idxs_is[psum] = plen; 710828143c3dSStefano Zampini ierr = ISGetIndices(isarray[j],&is_array_idxs);CHKERRQ(ierr); 710928143c3dSStefano Zampini ierr = PetscMemcpy(&send_buffer_idxs_is[psum+1],is_array_idxs,plen*sizeof(PetscInt));CHKERRQ(ierr); 711028143c3dSStefano Zampini ierr = ISRestoreIndices(isarray[j],&is_array_idxs);CHKERRQ(ierr); 711128143c3dSStefano Zampini psum += plen+1; /* indices + lenght */ 711228143c3dSStefano Zampini } 711328143c3dSStefano Zampini for (i=0;i<n_sends;i++) { 711428143c3dSStefano Zampini ilengths_idxs_is[is_indices[i]] = psum; 711528143c3dSStefano Zampini } 711628143c3dSStefano Zampini ierr = PetscGatherMessageLengths(comm,n_sends,n_recvs,ilengths_idxs_is,&onodes_is,&olengths_idxs_is);CHKERRQ(ierr); 711728143c3dSStefano Zampini } 71183b3b1effSJed Brown ierr = MatISRestoreLocalMat(mat,&local_mat);CHKERRQ(ierr); 711928143c3dSStefano Zampini 7120e7931f94SStefano Zampini buf_size_idxs = 0; 7121e7931f94SStefano Zampini buf_size_vals = 0; 712228143c3dSStefano Zampini buf_size_idxs_is = 0; 71231ae86dd6SStefano Zampini buf_size_vecs = 0; 7124e7931f94SStefano Zampini for (i=0;i<n_recvs;i++) { 7125e7931f94SStefano Zampini 
buf_size_idxs += (PetscInt)olengths_idxs[i]; 7126e7931f94SStefano Zampini buf_size_vals += (PetscInt)olengths_vals[i]; 712728143c3dSStefano Zampini if (nis) buf_size_idxs_is += (PetscInt)olengths_idxs_is[i]; 71281ae86dd6SStefano Zampini if (nvecs) buf_size_vecs += (PetscInt)olengths_idxs[i]; 7129e7931f94SStefano Zampini } 7130785e854fSJed Brown ierr = PetscMalloc1(buf_size_idxs,&recv_buffer_idxs);CHKERRQ(ierr); 7131785e854fSJed Brown ierr = PetscMalloc1(buf_size_vals,&recv_buffer_vals);CHKERRQ(ierr); 713295ecbf38SStefano Zampini ierr = PetscMalloc1(buf_size_idxs_is,&recv_buffer_idxs_is);CHKERRQ(ierr); 71331ae86dd6SStefano Zampini ierr = PetscMalloc1(buf_size_vecs,&recv_buffer_vecs);CHKERRQ(ierr); 7134e7931f94SStefano Zampini 7135e7931f94SStefano Zampini /* get new tags for clean communications */ 7136e7931f94SStefano Zampini ierr = PetscObjectGetNewTag((PetscObject)mat,&tag_idxs);CHKERRQ(ierr); 7137e7931f94SStefano Zampini ierr = PetscObjectGetNewTag((PetscObject)mat,&tag_vals);CHKERRQ(ierr); 713828143c3dSStefano Zampini ierr = PetscObjectGetNewTag((PetscObject)mat,&tag_idxs_is);CHKERRQ(ierr); 71391ae86dd6SStefano Zampini ierr = PetscObjectGetNewTag((PetscObject)mat,&tag_vecs);CHKERRQ(ierr); 7140e7931f94SStefano Zampini 7141e7931f94SStefano Zampini /* allocate for requests */ 7142785e854fSJed Brown ierr = PetscMalloc1(n_sends,&send_req_idxs);CHKERRQ(ierr); 7143785e854fSJed Brown ierr = PetscMalloc1(n_sends,&send_req_vals);CHKERRQ(ierr); 714495ecbf38SStefano Zampini ierr = PetscMalloc1(n_sends,&send_req_idxs_is);CHKERRQ(ierr); 71451ae86dd6SStefano Zampini ierr = PetscMalloc1(n_sends,&send_req_vecs);CHKERRQ(ierr); 7146785e854fSJed Brown ierr = PetscMalloc1(n_recvs,&recv_req_idxs);CHKERRQ(ierr); 7147785e854fSJed Brown ierr = PetscMalloc1(n_recvs,&recv_req_vals);CHKERRQ(ierr); 714895ecbf38SStefano Zampini ierr = PetscMalloc1(n_recvs,&recv_req_idxs_is);CHKERRQ(ierr); 71491ae86dd6SStefano Zampini ierr = PetscMalloc1(n_recvs,&recv_req_vecs);CHKERRQ(ierr); 
7150e7931f94SStefano Zampini 7151e7931f94SStefano Zampini /* communications */ 7152e7931f94SStefano Zampini ptr_idxs = recv_buffer_idxs; 7153e7931f94SStefano Zampini ptr_vals = recv_buffer_vals; 715428143c3dSStefano Zampini ptr_idxs_is = recv_buffer_idxs_is; 71551ae86dd6SStefano Zampini ptr_vecs = recv_buffer_vecs; 7156e7931f94SStefano Zampini for (i=0;i<n_recvs;i++) { 7157e7931f94SStefano Zampini source_dest = onodes[i]; 7158e7931f94SStefano Zampini ierr = MPI_Irecv(ptr_idxs,olengths_idxs[i],MPIU_INT,source_dest,tag_idxs,comm,&recv_req_idxs[i]);CHKERRQ(ierr); 7159e7931f94SStefano Zampini ierr = MPI_Irecv(ptr_vals,olengths_vals[i],MPIU_SCALAR,source_dest,tag_vals,comm,&recv_req_vals[i]);CHKERRQ(ierr); 7160e7931f94SStefano Zampini ptr_idxs += olengths_idxs[i]; 7161e7931f94SStefano Zampini ptr_vals += olengths_vals[i]; 716228143c3dSStefano Zampini if (nis) { 716357de7509SStefano Zampini source_dest = onodes_is[i]; 716428143c3dSStefano Zampini ierr = MPI_Irecv(ptr_idxs_is,olengths_idxs_is[i],MPIU_INT,source_dest,tag_idxs_is,comm,&recv_req_idxs_is[i]);CHKERRQ(ierr); 716528143c3dSStefano Zampini ptr_idxs_is += olengths_idxs_is[i]; 716628143c3dSStefano Zampini } 71671ae86dd6SStefano Zampini if (nvecs) { 71681ae86dd6SStefano Zampini source_dest = onodes[i]; 71691ae86dd6SStefano Zampini ierr = MPI_Irecv(ptr_vecs,olengths_idxs[i]-2,MPIU_SCALAR,source_dest,tag_vecs,comm,&recv_req_vecs[i]);CHKERRQ(ierr); 71701ae86dd6SStefano Zampini ptr_vecs += olengths_idxs[i]-2; 71711ae86dd6SStefano Zampini } 7172e7931f94SStefano Zampini } 7173e7931f94SStefano Zampini for (i=0;i<n_sends;i++) { 7174e7931f94SStefano Zampini ierr = PetscMPIIntCast(is_indices[i],&source_dest);CHKERRQ(ierr); 7175e7931f94SStefano Zampini ierr = MPI_Isend(send_buffer_idxs,ilengths_idxs[source_dest],MPIU_INT,source_dest,tag_idxs,comm,&send_req_idxs[i]);CHKERRQ(ierr); 7176e7931f94SStefano Zampini ierr = 
MPI_Isend(send_buffer_vals,ilengths_vals[source_dest],MPIU_SCALAR,source_dest,tag_vals,comm,&send_req_vals[i]);CHKERRQ(ierr); 717728143c3dSStefano Zampini if (nis) { 717828143c3dSStefano Zampini ierr = MPI_Isend(send_buffer_idxs_is,ilengths_idxs_is[source_dest],MPIU_INT,source_dest,tag_idxs_is,comm,&send_req_idxs_is[i]);CHKERRQ(ierr); 717928143c3dSStefano Zampini } 71801ae86dd6SStefano Zampini if (nvecs) { 71811ae86dd6SStefano Zampini ierr = VecGetArray(nnsp_vec[0],&send_buffer_vecs);CHKERRQ(ierr); 71821ae86dd6SStefano Zampini ierr = MPI_Isend(send_buffer_vecs,ilengths_idxs[source_dest]-2,MPIU_SCALAR,source_dest,tag_vecs,comm,&send_req_vecs[i]);CHKERRQ(ierr); 71831ae86dd6SStefano Zampini } 7184e7931f94SStefano Zampini } 7185e7931f94SStefano Zampini ierr = ISRestoreIndices(is_sends_internal,&is_indices);CHKERRQ(ierr); 7186e7931f94SStefano Zampini ierr = ISDestroy(&is_sends_internal);CHKERRQ(ierr); 7187e7931f94SStefano Zampini 7188e7931f94SStefano Zampini /* assemble new l2g map */ 7189e7931f94SStefano Zampini ierr = MPI_Waitall(n_recvs,recv_req_idxs,MPI_STATUSES_IGNORE);CHKERRQ(ierr); 7190e7931f94SStefano Zampini ptr_idxs = recv_buffer_idxs; 71919d30be91SStefano Zampini new_local_rows = 0; 7192e7931f94SStefano Zampini for (i=0;i<n_recvs;i++) { 71939d30be91SStefano Zampini new_local_rows += *(ptr_idxs+1); /* second element is the local size of the l2gmap */ 7194e7931f94SStefano Zampini ptr_idxs += olengths_idxs[i]; 7195e7931f94SStefano Zampini } 71969d30be91SStefano Zampini ierr = PetscMalloc1(new_local_rows,&l2gmap_indices);CHKERRQ(ierr); 7197e7931f94SStefano Zampini ptr_idxs = recv_buffer_idxs; 71989d30be91SStefano Zampini new_local_rows = 0; 7199e7931f94SStefano Zampini for (i=0;i<n_recvs;i++) { 72009d30be91SStefano Zampini ierr = PetscMemcpy(&l2gmap_indices[new_local_rows],ptr_idxs+2,(*(ptr_idxs+1))*sizeof(PetscInt));CHKERRQ(ierr); 72019d30be91SStefano Zampini new_local_rows += *(ptr_idxs+1); /* second element is the local size of the l2gmap */ 
7202e7931f94SStefano Zampini ptr_idxs += olengths_idxs[i]; 7203e7931f94SStefano Zampini } 72049d30be91SStefano Zampini ierr = PetscSortRemoveDupsInt(&new_local_rows,l2gmap_indices);CHKERRQ(ierr); 72059d30be91SStefano Zampini ierr = ISLocalToGlobalMappingCreate(comm_n,1,new_local_rows,l2gmap_indices,PETSC_COPY_VALUES,&l2gmap);CHKERRQ(ierr); 7206e7931f94SStefano Zampini ierr = PetscFree(l2gmap_indices);CHKERRQ(ierr); 7207e7931f94SStefano Zampini 7208e7931f94SStefano Zampini /* infer new local matrix type from received local matrices type */ 7209e7931f94SStefano Zampini /* currently if all local matrices are of type X, then the resulting matrix will be of type X, except for the dense case */ 7210e7931f94SStefano Zampini /* it also assumes that if the block size is set, than it is the same among all local matrices (see checks at the beginning of the function) */ 7211e7931f94SStefano Zampini if (n_recvs) { 721228143c3dSStefano Zampini MatTypePrivate new_local_type_private = (MatTypePrivate)send_buffer_idxs[0]; 7213e7931f94SStefano Zampini ptr_idxs = recv_buffer_idxs; 7214e7931f94SStefano Zampini for (i=0;i<n_recvs;i++) { 7215e7931f94SStefano Zampini if ((PetscInt)new_local_type_private != *ptr_idxs) { 7216e7931f94SStefano Zampini new_local_type_private = MATAIJ_PRIVATE; 7217e7931f94SStefano Zampini break; 7218e7931f94SStefano Zampini } 7219e7931f94SStefano Zampini ptr_idxs += olengths_idxs[i]; 7220e7931f94SStefano Zampini } 7221e7931f94SStefano Zampini switch (new_local_type_private) { 722228143c3dSStefano Zampini case MATDENSE_PRIVATE: 7223e7931f94SStefano Zampini new_local_type = MATSEQAIJ; 7224e7931f94SStefano Zampini bs = 1; 7225e7931f94SStefano Zampini break; 7226e7931f94SStefano Zampini case MATAIJ_PRIVATE: 7227e7931f94SStefano Zampini new_local_type = MATSEQAIJ; 7228e7931f94SStefano Zampini bs = 1; 7229e7931f94SStefano Zampini break; 7230e7931f94SStefano Zampini case MATBAIJ_PRIVATE: 7231e7931f94SStefano Zampini new_local_type = MATSEQBAIJ; 7232e7931f94SStefano 
Zampini break; 7233e7931f94SStefano Zampini case MATSBAIJ_PRIVATE: 7234e7931f94SStefano Zampini new_local_type = MATSEQSBAIJ; 7235e7931f94SStefano Zampini break; 7236e7931f94SStefano Zampini default: 7237fbfcfee5SBarry Smith SETERRQ2(comm,PETSC_ERR_SUP,"Unsupported private type %d in %s",new_local_type_private,PETSC_FUNCTION_NAME); 7238e7931f94SStefano Zampini break; 7239e7931f94SStefano Zampini } 7240ed8ed4edSstefano_zampini } else { /* by default, new_local_type is seqaij */ 7241ed8ed4edSstefano_zampini new_local_type = MATSEQAIJ; 724228143c3dSStefano Zampini bs = 1; 7243e7931f94SStefano Zampini } 7244e7931f94SStefano Zampini 724570cf5478SStefano Zampini /* create MATIS object if needed */ 724657de7509SStefano Zampini if (!reuse) { 7247e7931f94SStefano Zampini ierr = MatGetSize(mat,&rows,&cols);CHKERRQ(ierr); 7248e176bc59SStefano Zampini ierr = MatCreateIS(comm_n,bs,PETSC_DECIDE,PETSC_DECIDE,rows,cols,l2gmap,NULL,mat_n);CHKERRQ(ierr); 724970cf5478SStefano Zampini } else { 725070cf5478SStefano Zampini /* it also destroys the local matrices */ 725157de7509SStefano Zampini if (*mat_n) { 725270cf5478SStefano Zampini ierr = MatSetLocalToGlobalMapping(*mat_n,l2gmap,l2gmap);CHKERRQ(ierr); 725357de7509SStefano Zampini } else { /* this is a fake object */ 725457de7509SStefano Zampini ierr = MatCreateIS(comm_n,bs,PETSC_DECIDE,PETSC_DECIDE,rows,cols,l2gmap,NULL,mat_n);CHKERRQ(ierr); 725557de7509SStefano Zampini } 725670cf5478SStefano Zampini } 725770cf5478SStefano Zampini ierr = MatISGetLocalMat(*mat_n,&local_mat);CHKERRQ(ierr); 7258e7931f94SStefano Zampini ierr = MatSetType(local_mat,new_local_type);CHKERRQ(ierr); 72599d30be91SStefano Zampini 72609d30be91SStefano Zampini ierr = MPI_Waitall(n_recvs,recv_req_vals,MPI_STATUSES_IGNORE);CHKERRQ(ierr); 72619d30be91SStefano Zampini 72629d30be91SStefano Zampini /* Global to local map of received indices */ 72639d30be91SStefano Zampini ierr = PetscMalloc1(buf_size_idxs,&recv_buffer_idxs_local);CHKERRQ(ierr); /* needed for values 
insertion */ 72649d30be91SStefano Zampini ierr = ISGlobalToLocalMappingApply(l2gmap,IS_GTOLM_MASK,buf_size_idxs,recv_buffer_idxs,&i,recv_buffer_idxs_local);CHKERRQ(ierr); 72659d30be91SStefano Zampini ierr = ISLocalToGlobalMappingDestroy(&l2gmap);CHKERRQ(ierr); 72669d30be91SStefano Zampini 72679d30be91SStefano Zampini /* restore attributes -> type of incoming data and its size */ 72689d30be91SStefano Zampini buf_size_idxs = 0; 72699d30be91SStefano Zampini for (i=0;i<n_recvs;i++) { 72709d30be91SStefano Zampini recv_buffer_idxs_local[buf_size_idxs] = recv_buffer_idxs[buf_size_idxs]; 72719d30be91SStefano Zampini recv_buffer_idxs_local[buf_size_idxs+1] = recv_buffer_idxs[buf_size_idxs+1]; 72729d30be91SStefano Zampini buf_size_idxs += (PetscInt)olengths_idxs[i]; 72739d30be91SStefano Zampini } 72749d30be91SStefano Zampini ierr = PetscFree(recv_buffer_idxs);CHKERRQ(ierr); 72759d30be91SStefano Zampini 72769d30be91SStefano Zampini /* set preallocation */ 72779d30be91SStefano Zampini ierr = PetscObjectTypeCompare((PetscObject)local_mat,MATSEQDENSE,&newisdense);CHKERRQ(ierr); 72789d30be91SStefano Zampini if (!newisdense) { 72799d30be91SStefano Zampini PetscInt *new_local_nnz=0; 72809d30be91SStefano Zampini 72819d30be91SStefano Zampini ptr_idxs = recv_buffer_idxs_local; 72829d30be91SStefano Zampini if (n_recvs) { 72839d30be91SStefano Zampini ierr = PetscCalloc1(new_local_rows,&new_local_nnz);CHKERRQ(ierr); 72849d30be91SStefano Zampini } 72859d30be91SStefano Zampini for (i=0;i<n_recvs;i++) { 72869d30be91SStefano Zampini PetscInt j; 72879d30be91SStefano Zampini if (*ptr_idxs == (PetscInt)MATDENSE_PRIVATE) { /* preallocation provided for dense case only */ 72889d30be91SStefano Zampini for (j=0;j<*(ptr_idxs+1);j++) { 72899d30be91SStefano Zampini new_local_nnz[*(ptr_idxs+2+j)] += *(ptr_idxs+1); 72909d30be91SStefano Zampini } 72919d30be91SStefano Zampini } else { 72929d30be91SStefano Zampini /* TODO */ 72939d30be91SStefano Zampini } 72949d30be91SStefano Zampini ptr_idxs += 
olengths_idxs[i]; 72959d30be91SStefano Zampini } 72969d30be91SStefano Zampini if (new_local_nnz) { 72979d30be91SStefano Zampini for (i=0;i<new_local_rows;i++) new_local_nnz[i] = PetscMin(new_local_nnz[i],new_local_rows); 72989d30be91SStefano Zampini ierr = MatSeqAIJSetPreallocation(local_mat,0,new_local_nnz);CHKERRQ(ierr); 72999d30be91SStefano Zampini for (i=0;i<new_local_rows;i++) new_local_nnz[i] /= bs; 73009d30be91SStefano Zampini ierr = MatSeqBAIJSetPreallocation(local_mat,bs,0,new_local_nnz);CHKERRQ(ierr); 73019d30be91SStefano Zampini for (i=0;i<new_local_rows;i++) new_local_nnz[i] = PetscMax(new_local_nnz[i]-i,0); 73029d30be91SStefano Zampini ierr = MatSeqSBAIJSetPreallocation(local_mat,bs,0,new_local_nnz);CHKERRQ(ierr); 73039d30be91SStefano Zampini } else { 73049d30be91SStefano Zampini ierr = MatSetUp(local_mat);CHKERRQ(ierr); 73059d30be91SStefano Zampini } 73069d30be91SStefano Zampini ierr = PetscFree(new_local_nnz);CHKERRQ(ierr); 73079d30be91SStefano Zampini } else { 73089d30be91SStefano Zampini ierr = MatSetUp(local_mat);CHKERRQ(ierr); 73099d30be91SStefano Zampini } 7310e7931f94SStefano Zampini 7311e7931f94SStefano Zampini /* set values */ 7312e7931f94SStefano Zampini ptr_vals = recv_buffer_vals; 73139d30be91SStefano Zampini ptr_idxs = recv_buffer_idxs_local; 7314e7931f94SStefano Zampini for (i=0;i<n_recvs;i++) { 7315e7931f94SStefano Zampini if (*ptr_idxs == (PetscInt)MATDENSE_PRIVATE) { /* values insertion provided for dense case only */ 7316e7931f94SStefano Zampini ierr = MatSetOption(local_mat,MAT_ROW_ORIENTED,PETSC_FALSE);CHKERRQ(ierr); 73179d30be91SStefano Zampini ierr = MatSetValues(local_mat,*(ptr_idxs+1),ptr_idxs+2,*(ptr_idxs+1),ptr_idxs+2,ptr_vals,ADD_VALUES);CHKERRQ(ierr); 7318e7931f94SStefano Zampini ierr = MatAssemblyBegin(local_mat,MAT_FLUSH_ASSEMBLY);CHKERRQ(ierr); 7319e7931f94SStefano Zampini ierr = MatAssemblyEnd(local_mat,MAT_FLUSH_ASSEMBLY);CHKERRQ(ierr); 7320e7931f94SStefano Zampini ierr = 
MatSetOption(local_mat,MAT_ROW_ORIENTED,PETSC_TRUE);CHKERRQ(ierr); 732128143c3dSStefano Zampini } else { 732228143c3dSStefano Zampini /* TODO */ 7323e7931f94SStefano Zampini } 7324e7931f94SStefano Zampini ptr_idxs += olengths_idxs[i]; 7325e7931f94SStefano Zampini ptr_vals += olengths_vals[i]; 7326e7931f94SStefano Zampini } 7327e7931f94SStefano Zampini ierr = MatAssemblyBegin(local_mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 7328e7931f94SStefano Zampini ierr = MatAssemblyEnd(local_mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 73293b3b1effSJed Brown ierr = MatISRestoreLocalMat(*mat_n,&local_mat);CHKERRQ(ierr); 733070cf5478SStefano Zampini ierr = MatAssemblyBegin(*mat_n,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 733170cf5478SStefano Zampini ierr = MatAssemblyEnd(*mat_n,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 73329d30be91SStefano Zampini ierr = PetscFree(recv_buffer_vals);CHKERRQ(ierr); 7333e7931f94SStefano Zampini 7334dfd14d43SStefano Zampini #if 0 733528143c3dSStefano Zampini if (!restrict_comm) { /* check */ 7336e7931f94SStefano Zampini Vec lvec,rvec; 7337e7931f94SStefano Zampini PetscReal infty_error; 7338e7931f94SStefano Zampini 73392a7a6963SBarry Smith ierr = MatCreateVecs(mat,&rvec,&lvec);CHKERRQ(ierr); 7340e7931f94SStefano Zampini ierr = VecSetRandom(rvec,NULL);CHKERRQ(ierr); 7341e7931f94SStefano Zampini ierr = MatMult(mat,rvec,lvec);CHKERRQ(ierr); 7342e7931f94SStefano Zampini ierr = VecScale(lvec,-1.0);CHKERRQ(ierr); 734370cf5478SStefano Zampini ierr = MatMultAdd(*mat_n,rvec,lvec,lvec);CHKERRQ(ierr); 7344e7931f94SStefano Zampini ierr = VecNorm(lvec,NORM_INFINITY,&infty_error);CHKERRQ(ierr); 7345e7931f94SStefano Zampini ierr = PetscPrintf(PetscObjectComm((PetscObject)mat),"Infinity error subassembling %1.6e\n",infty_error); 7346e7931f94SStefano Zampini ierr = VecDestroy(&rvec);CHKERRQ(ierr); 7347e7931f94SStefano Zampini ierr = VecDestroy(&lvec);CHKERRQ(ierr); 7348e7931f94SStefano Zampini } 734928143c3dSStefano Zampini #endif 7350e7931f94SStefano Zampini 735128143c3dSStefano Zampini /* 
assemble new additional is (if any) */ 735228143c3dSStefano Zampini if (nis) { 735328143c3dSStefano Zampini PetscInt **temp_idxs,*count_is,j,psum; 735428143c3dSStefano Zampini 735528143c3dSStefano Zampini ierr = MPI_Waitall(n_recvs,recv_req_idxs_is,MPI_STATUSES_IGNORE);CHKERRQ(ierr); 7356854ce69bSBarry Smith ierr = PetscCalloc1(nis,&count_is);CHKERRQ(ierr); 735728143c3dSStefano Zampini ptr_idxs = recv_buffer_idxs_is; 735828143c3dSStefano Zampini psum = 0; 735928143c3dSStefano Zampini for (i=0;i<n_recvs;i++) { 736028143c3dSStefano Zampini for (j=0;j<nis;j++) { 736128143c3dSStefano Zampini PetscInt plen = *(ptr_idxs); /* first element is the local size of IS's indices */ 736228143c3dSStefano Zampini count_is[j] += plen; /* increment counting of buffer for j-th IS */ 736328143c3dSStefano Zampini psum += plen; 736428143c3dSStefano Zampini ptr_idxs += plen+1; /* shift pointer to received data */ 736528143c3dSStefano Zampini } 736628143c3dSStefano Zampini } 7367854ce69bSBarry Smith ierr = PetscMalloc1(nis,&temp_idxs);CHKERRQ(ierr); 7368854ce69bSBarry Smith ierr = PetscMalloc1(psum,&temp_idxs[0]);CHKERRQ(ierr); 736928143c3dSStefano Zampini for (i=1;i<nis;i++) { 737028143c3dSStefano Zampini temp_idxs[i] = temp_idxs[i-1]+count_is[i-1]; 737128143c3dSStefano Zampini } 737228143c3dSStefano Zampini ierr = PetscMemzero(count_is,nis*sizeof(PetscInt));CHKERRQ(ierr); 737328143c3dSStefano Zampini ptr_idxs = recv_buffer_idxs_is; 737428143c3dSStefano Zampini for (i=0;i<n_recvs;i++) { 737528143c3dSStefano Zampini for (j=0;j<nis;j++) { 737628143c3dSStefano Zampini PetscInt plen = *(ptr_idxs); /* first element is the local size of IS's indices */ 737728143c3dSStefano Zampini ierr = PetscMemcpy(&temp_idxs[j][count_is[j]],ptr_idxs+1,plen*sizeof(PetscInt));CHKERRQ(ierr); 737828143c3dSStefano Zampini count_is[j] += plen; /* increment starting point of buffer for j-th IS */ 737928143c3dSStefano Zampini ptr_idxs += plen+1; /* shift pointer to received data */ 738028143c3dSStefano Zampini } 
738128143c3dSStefano Zampini } 738228143c3dSStefano Zampini for (i=0;i<nis;i++) { 738328143c3dSStefano Zampini ierr = ISDestroy(&isarray[i]);CHKERRQ(ierr); 738428143c3dSStefano Zampini ierr = PetscSortRemoveDupsInt(&count_is[i],temp_idxs[i]);CHKERRQ(ierr);CHKERRQ(ierr); 738528143c3dSStefano Zampini ierr = ISCreateGeneral(comm_n,count_is[i],temp_idxs[i],PETSC_COPY_VALUES,&isarray[i]);CHKERRQ(ierr); 738628143c3dSStefano Zampini } 738728143c3dSStefano Zampini ierr = PetscFree(count_is);CHKERRQ(ierr); 738828143c3dSStefano Zampini ierr = PetscFree(temp_idxs[0]);CHKERRQ(ierr); 738928143c3dSStefano Zampini ierr = PetscFree(temp_idxs);CHKERRQ(ierr); 739028143c3dSStefano Zampini } 7391e7931f94SStefano Zampini /* free workspace */ 739228143c3dSStefano Zampini ierr = PetscFree(recv_buffer_idxs_is);CHKERRQ(ierr); 7393e7931f94SStefano Zampini ierr = MPI_Waitall(n_sends,send_req_idxs,MPI_STATUSES_IGNORE);CHKERRQ(ierr); 7394e7931f94SStefano Zampini ierr = PetscFree(send_buffer_idxs);CHKERRQ(ierr); 7395e7931f94SStefano Zampini ierr = MPI_Waitall(n_sends,send_req_vals,MPI_STATUSES_IGNORE);CHKERRQ(ierr); 7396e7931f94SStefano Zampini if (isdense) { 7397e7931f94SStefano Zampini ierr = MatISGetLocalMat(mat,&local_mat);CHKERRQ(ierr); 7398e7931f94SStefano Zampini ierr = MatDenseRestoreArray(local_mat,&send_buffer_vals);CHKERRQ(ierr); 73993b3b1effSJed Brown ierr = MatISRestoreLocalMat(mat,&local_mat);CHKERRQ(ierr); 7400e7931f94SStefano Zampini } else { 7401e7931f94SStefano Zampini /* ierr = PetscFree(send_buffer_vals);CHKERRQ(ierr); */ 7402e7931f94SStefano Zampini } 740328143c3dSStefano Zampini if (nis) { 740428143c3dSStefano Zampini ierr = MPI_Waitall(n_sends,send_req_idxs_is,MPI_STATUSES_IGNORE);CHKERRQ(ierr); 740528143c3dSStefano Zampini ierr = PetscFree(send_buffer_idxs_is);CHKERRQ(ierr); 740628143c3dSStefano Zampini } 74071ae86dd6SStefano Zampini 74081ae86dd6SStefano Zampini if (nvecs) { 74091ae86dd6SStefano Zampini ierr = 
MPI_Waitall(n_recvs,recv_req_vecs,MPI_STATUSES_IGNORE);CHKERRQ(ierr); 74101ae86dd6SStefano Zampini ierr = MPI_Waitall(n_sends,send_req_vecs,MPI_STATUSES_IGNORE);CHKERRQ(ierr); 74111ae86dd6SStefano Zampini ierr = VecRestoreArray(nnsp_vec[0],&send_buffer_vecs);CHKERRQ(ierr); 74121ae86dd6SStefano Zampini ierr = VecDestroy(&nnsp_vec[0]);CHKERRQ(ierr); 74131ae86dd6SStefano Zampini ierr = VecCreate(comm_n,&nnsp_vec[0]);CHKERRQ(ierr); 74141ae86dd6SStefano Zampini ierr = VecSetSizes(nnsp_vec[0],new_local_rows,PETSC_DECIDE);CHKERRQ(ierr); 74151ae86dd6SStefano Zampini ierr = VecSetType(nnsp_vec[0],VECSTANDARD);CHKERRQ(ierr); 74161ae86dd6SStefano Zampini /* set values */ 74171ae86dd6SStefano Zampini ptr_vals = recv_buffer_vecs; 74181ae86dd6SStefano Zampini ptr_idxs = recv_buffer_idxs_local; 74191ae86dd6SStefano Zampini ierr = VecGetArray(nnsp_vec[0],&send_buffer_vecs);CHKERRQ(ierr); 74201ae86dd6SStefano Zampini for (i=0;i<n_recvs;i++) { 74211ae86dd6SStefano Zampini PetscInt j; 74221ae86dd6SStefano Zampini for (j=0;j<*(ptr_idxs+1);j++) { 74231ae86dd6SStefano Zampini send_buffer_vecs[*(ptr_idxs+2+j)] += *(ptr_vals + j); 74241ae86dd6SStefano Zampini } 74251ae86dd6SStefano Zampini ptr_idxs += olengths_idxs[i]; 74261ae86dd6SStefano Zampini ptr_vals += olengths_idxs[i]-2; 74271ae86dd6SStefano Zampini } 74281ae86dd6SStefano Zampini ierr = VecRestoreArray(nnsp_vec[0],&send_buffer_vecs);CHKERRQ(ierr); 74291ae86dd6SStefano Zampini ierr = VecAssemblyBegin(nnsp_vec[0]);CHKERRQ(ierr); 74301ae86dd6SStefano Zampini ierr = VecAssemblyEnd(nnsp_vec[0]);CHKERRQ(ierr); 74311ae86dd6SStefano Zampini } 74321ae86dd6SStefano Zampini 74331ae86dd6SStefano Zampini ierr = PetscFree(recv_buffer_vecs);CHKERRQ(ierr); 74341ae86dd6SStefano Zampini ierr = PetscFree(recv_buffer_idxs_local);CHKERRQ(ierr); 7435e7931f94SStefano Zampini ierr = PetscFree(recv_req_idxs);CHKERRQ(ierr); 7436e7931f94SStefano Zampini ierr = PetscFree(recv_req_vals);CHKERRQ(ierr); 74371ae86dd6SStefano Zampini ierr = 
PetscFree(recv_req_vecs);CHKERRQ(ierr); 743828143c3dSStefano Zampini ierr = PetscFree(recv_req_idxs_is);CHKERRQ(ierr); 7439e7931f94SStefano Zampini ierr = PetscFree(send_req_idxs);CHKERRQ(ierr); 7440e7931f94SStefano Zampini ierr = PetscFree(send_req_vals);CHKERRQ(ierr); 74411ae86dd6SStefano Zampini ierr = PetscFree(send_req_vecs);CHKERRQ(ierr); 744228143c3dSStefano Zampini ierr = PetscFree(send_req_idxs_is);CHKERRQ(ierr); 7443e7931f94SStefano Zampini ierr = PetscFree(ilengths_vals);CHKERRQ(ierr); 7444e7931f94SStefano Zampini ierr = PetscFree(ilengths_idxs);CHKERRQ(ierr); 7445e7931f94SStefano Zampini ierr = PetscFree(olengths_vals);CHKERRQ(ierr); 7446e7931f94SStefano Zampini ierr = PetscFree(olengths_idxs);CHKERRQ(ierr); 7447e7931f94SStefano Zampini ierr = PetscFree(onodes);CHKERRQ(ierr); 744828143c3dSStefano Zampini if (nis) { 744928143c3dSStefano Zampini ierr = PetscFree(ilengths_idxs_is);CHKERRQ(ierr); 745028143c3dSStefano Zampini ierr = PetscFree(olengths_idxs_is);CHKERRQ(ierr); 745128143c3dSStefano Zampini ierr = PetscFree(onodes_is);CHKERRQ(ierr); 745228143c3dSStefano Zampini } 745328143c3dSStefano Zampini ierr = PetscSubcommDestroy(&subcomm);CHKERRQ(ierr); 745428143c3dSStefano Zampini if (destroy_mat) { /* destroy mat is true only if restrict comm is true and process will not partecipate */ 745528143c3dSStefano Zampini ierr = MatDestroy(mat_n);CHKERRQ(ierr); 745628143c3dSStefano Zampini for (i=0;i<nis;i++) { 745728143c3dSStefano Zampini ierr = ISDestroy(&isarray[i]);CHKERRQ(ierr); 745828143c3dSStefano Zampini } 74591ae86dd6SStefano Zampini if (nvecs) { /* need to match VecDestroy nnsp_vec called in the other code path */ 74601ae86dd6SStefano Zampini ierr = VecDestroy(&nnsp_vec[0]);CHKERRQ(ierr); 74611ae86dd6SStefano Zampini } 746253a05cb3SStefano Zampini *mat_n = NULL; 746328143c3dSStefano Zampini } 7464e7931f94SStefano Zampini PetscFunctionReturn(0); 7465e7931f94SStefano Zampini } 7466a57a6d2fSStefano Zampini 746712edc857SStefano Zampini /* temporary hack 
into ksp private data structure */ 7468af0996ceSBarry Smith #include <petsc/private/kspimpl.h> 746912edc857SStefano Zampini 7470c8587f34SStefano Zampini PetscErrorCode PCBDDCSetUpCoarseSolver(PC pc,PetscScalar* coarse_submat_vals) 7471c8587f34SStefano Zampini { 7472c8587f34SStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 7473c8587f34SStefano Zampini PC_IS *pcis = (PC_IS*)pc->data; 747420a2ab83SStefano Zampini Mat coarse_mat,coarse_mat_is,coarse_submat_dense; 74751ae86dd6SStefano Zampini Mat coarsedivudotp = NULL; 74761e0482f5SStefano Zampini Mat coarseG,t_coarse_mat_is; 74779881197aSStefano Zampini MatNullSpace CoarseNullSpace = NULL; 747820a2ab83SStefano Zampini ISLocalToGlobalMapping coarse_islg; 74796e683305SStefano Zampini IS coarse_is,*isarray; 74806e683305SStefano Zampini PetscInt i,im_active=-1,active_procs=-1; 748130368db7SStefano Zampini PetscInt nis,nisdofs,nisneu,nisvert; 7482f9eb5b7dSStefano Zampini PC pc_temp; 7483c8587f34SStefano Zampini PCType coarse_pc_type; 7484c8587f34SStefano Zampini KSPType coarse_ksp_type; 7485f9eb5b7dSStefano Zampini PetscBool multilevel_requested,multilevel_allowed; 74864f3a063dSStefano Zampini PetscBool isredundant,isbddc,isnn,coarse_reuse; 74871e0482f5SStefano Zampini PetscInt ncoarse,nedcfield; 748868457ee5SStefano Zampini PetscBool compute_vecs = PETSC_FALSE; 748922bc73bbSStefano Zampini PetscScalar *array; 749057de7509SStefano Zampini MatReuse coarse_mat_reuse; 749157de7509SStefano Zampini PetscBool restr, full_restr, have_void; 74927de4f681Sstefano_zampini PetscMPIInt commsize; 74939881197aSStefano Zampini PetscErrorCode ierr; 7494fdc09c96SStefano Zampini 7495c8587f34SStefano Zampini PetscFunctionBegin; 7496c8587f34SStefano Zampini /* Assign global numbering to coarse dofs */ 749768457ee5SStefano Zampini if (pcbddc->new_primal_space || pcbddc->coarse_size == -1) { /* a new primal space is present or it is the first initialization, so recompute global numbering */ 7498fa7f1dd8SStefano Zampini PetscInt ocoarse_size; 
74995a75c04eSSatish Balay compute_vecs = PETSC_TRUE; 75007de4f681Sstefano_zampini 75017de4f681Sstefano_zampini pcbddc->new_primal_space = PETSC_TRUE; 7502fa7f1dd8SStefano Zampini ocoarse_size = pcbddc->coarse_size; 7503f4ddd8eeSStefano Zampini ierr = PetscFree(pcbddc->global_primal_indices);CHKERRQ(ierr); 7504f4ddd8eeSStefano Zampini ierr = PCBDDCComputePrimalNumbering(pc,&pcbddc->coarse_size,&pcbddc->global_primal_indices);CHKERRQ(ierr); 7505f4ddd8eeSStefano Zampini /* see if we can avoid some work */ 7506fa7f1dd8SStefano Zampini if (pcbddc->coarse_ksp) { /* coarse ksp has already been created */ 750751bea450SStefano Zampini /* if the coarse size is different or we are using adaptive selection, better to not reuse the coarse matrix */ 750851bea450SStefano Zampini if (ocoarse_size != pcbddc->coarse_size || pcbddc->adaptive_selection) { 7509727cdba6SStefano Zampini ierr = KSPReset(pcbddc->coarse_ksp);CHKERRQ(ierr); 7510fa7f1dd8SStefano Zampini coarse_reuse = PETSC_FALSE; 7511fa7f1dd8SStefano Zampini } else { /* we can safely reuse already computed coarse matrix */ 7512fa7f1dd8SStefano Zampini coarse_reuse = PETSC_TRUE; 7513f4ddd8eeSStefano Zampini } 7514fa7f1dd8SStefano Zampini } else { /* there's no coarse ksp, so we need to create the coarse matrix too */ 7515fa7f1dd8SStefano Zampini coarse_reuse = PETSC_FALSE; 7516f4ddd8eeSStefano Zampini } 751770cf5478SStefano Zampini /* reset any subassembling information */ 751857de7509SStefano Zampini if (!coarse_reuse || pcbddc->recompute_topography) { 751970cf5478SStefano Zampini ierr = ISDestroy(&pcbddc->coarse_subassembling);CHKERRQ(ierr); 752057de7509SStefano Zampini } 75216e683305SStefano Zampini } else { /* primal space is unchanged, so we can reuse coarse matrix */ 7522fa7f1dd8SStefano Zampini coarse_reuse = PETSC_TRUE; 7523f4ddd8eeSStefano Zampini } 752457de7509SStefano Zampini /* assemble coarse matrix */ 752557de7509SStefano Zampini if (coarse_reuse && pcbddc->coarse_ksp) { 752657de7509SStefano Zampini ierr = 
KSPGetOperators(pcbddc->coarse_ksp,&coarse_mat,NULL);CHKERRQ(ierr); 752757de7509SStefano Zampini ierr = PetscObjectReference((PetscObject)coarse_mat);CHKERRQ(ierr); 752857de7509SStefano Zampini coarse_mat_reuse = MAT_REUSE_MATRIX; 752918a45a71SStefano Zampini } else { 753057de7509SStefano Zampini coarse_mat = NULL; 753157de7509SStefano Zampini coarse_mat_reuse = MAT_INITIAL_MATRIX; 75326e683305SStefano Zampini } 7533e7931f94SStefano Zampini 7534abbbba34SStefano Zampini /* creates temporary l2gmap and IS for coarse indexes */ 7535abbbba34SStefano Zampini ierr = ISCreateGeneral(PetscObjectComm((PetscObject)pc),pcbddc->local_primal_size,pcbddc->global_primal_indices,PETSC_COPY_VALUES,&coarse_is);CHKERRQ(ierr); 7536abbbba34SStefano Zampini ierr = ISLocalToGlobalMappingCreateIS(coarse_is,&coarse_islg);CHKERRQ(ierr); 7537abbbba34SStefano Zampini 7538abbbba34SStefano Zampini /* creates temporary MATIS object for coarse matrix */ 753922bc73bbSStefano Zampini ierr = MatCreateSeqDense(PETSC_COMM_SELF,pcbddc->local_primal_size,pcbddc->local_primal_size,NULL,&coarse_submat_dense);CHKERRQ(ierr); 754022bc73bbSStefano Zampini ierr = MatDenseGetArray(coarse_submat_dense,&array);CHKERRQ(ierr); 754122bc73bbSStefano Zampini ierr = PetscMemcpy(array,coarse_submat_vals,sizeof(*coarse_submat_vals)*pcbddc->local_primal_size*pcbddc->local_primal_size);CHKERRQ(ierr); 754222bc73bbSStefano Zampini ierr = MatDenseRestoreArray(coarse_submat_dense,&array);CHKERRQ(ierr); 7543e176bc59SStefano Zampini ierr = MatCreateIS(PetscObjectComm((PetscObject)pc),1,PETSC_DECIDE,PETSC_DECIDE,pcbddc->coarse_size,pcbddc->coarse_size,coarse_islg,NULL,&t_coarse_mat_is);CHKERRQ(ierr); 75446e683305SStefano Zampini ierr = MatISSetLocalMat(t_coarse_mat_is,coarse_submat_dense);CHKERRQ(ierr); 75456e683305SStefano Zampini ierr = MatAssemblyBegin(t_coarse_mat_is,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 75466e683305SStefano Zampini ierr = MatAssemblyEnd(t_coarse_mat_is,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 7547abbbba34SStefano 
Zampini ierr = MatDestroy(&coarse_submat_dense);CHKERRQ(ierr); 7548abbbba34SStefano Zampini 754957de7509SStefano Zampini /* count "active" (i.e. with positive local size) and "void" processes */ 755057de7509SStefano Zampini im_active = !!(pcis->n); 755157de7509SStefano Zampini ierr = MPIU_Allreduce(&im_active,&active_procs,1,MPIU_INT,MPI_SUM,PetscObjectComm((PetscObject)pc));CHKERRQ(ierr); 755257de7509SStefano Zampini 755314f0bfb9SStefano Zampini /* determine number of processes partecipating to coarse solver and compute subassembling pattern */ 755457de7509SStefano Zampini /* restr : whether if we want to exclude senders (which are not receivers) from the subassembling pattern */ 755557de7509SStefano Zampini /* full_restr : just use the receivers from the subassembling pattern */ 75567de4f681Sstefano_zampini ierr = MPI_Comm_size(PetscObjectComm((PetscObject)pc),&commsize);CHKERRQ(ierr); 755757de7509SStefano Zampini coarse_mat_is = NULL; 755857de7509SStefano Zampini multilevel_allowed = PETSC_FALSE; 755957de7509SStefano Zampini multilevel_requested = PETSC_FALSE; 75601ae86dd6SStefano Zampini pcbddc->coarse_eqs_per_proc = PetscMin(PetscMax(pcbddc->coarse_size,1),pcbddc->coarse_eqs_per_proc); 756157de7509SStefano Zampini if (pcbddc->current_level < pcbddc->max_levels) multilevel_requested = PETSC_TRUE; 756257de7509SStefano Zampini if (multilevel_requested) { 756357de7509SStefano Zampini ncoarse = active_procs/pcbddc->coarsening_ratio; 756457de7509SStefano Zampini restr = PETSC_FALSE; 756557de7509SStefano Zampini full_restr = PETSC_FALSE; 756657de7509SStefano Zampini } else { 756757de7509SStefano Zampini ncoarse = pcbddc->coarse_size/pcbddc->coarse_eqs_per_proc; 756857de7509SStefano Zampini restr = PETSC_TRUE; 756957de7509SStefano Zampini full_restr = PETSC_TRUE; 757057de7509SStefano Zampini } 75717de4f681Sstefano_zampini if (!pcbddc->coarse_size || commsize == 1) multilevel_allowed = multilevel_requested = restr = full_restr = PETSC_FALSE; 757257de7509SStefano 
Zampini ncoarse = PetscMax(1,ncoarse); 757357de7509SStefano Zampini if (!pcbddc->coarse_subassembling) { 7574a198735bSStefano Zampini if (pcbddc->coarsening_ratio > 1) { 7575bb360cb4SStefano Zampini if (multilevel_requested) { 7576bb360cb4SStefano Zampini ierr = PCBDDCMatISGetSubassemblingPattern(pc->pmat,&ncoarse,pcbddc->coarse_adj_red,&pcbddc->coarse_subassembling,&have_void);CHKERRQ(ierr); 7577bb360cb4SStefano Zampini } else { 7578bb360cb4SStefano Zampini ierr = PCBDDCMatISGetSubassemblingPattern(t_coarse_mat_is,&ncoarse,pcbddc->coarse_adj_red,&pcbddc->coarse_subassembling,&have_void);CHKERRQ(ierr); 7579bb360cb4SStefano Zampini } 7580a198735bSStefano Zampini } else { 75817de4f681Sstefano_zampini PetscMPIInt rank; 7582a198735bSStefano Zampini ierr = MPI_Comm_rank(PetscObjectComm((PetscObject)pc),&rank);CHKERRQ(ierr); 75837de4f681Sstefano_zampini have_void = (active_procs == (PetscInt)commsize) ? PETSC_FALSE : PETSC_TRUE; 7584a198735bSStefano Zampini ierr = ISCreateStride(PetscObjectComm((PetscObject)pc),1,rank,1,&pcbddc->coarse_subassembling);CHKERRQ(ierr); 7585a198735bSStefano Zampini } 758657de7509SStefano Zampini } else { /* if a subassembling pattern exists, then we can reuse the coarse ksp and compute the number of process involved */ 758757de7509SStefano Zampini PetscInt psum; 758857de7509SStefano Zampini if (pcbddc->coarse_ksp) psum = 1; 758957de7509SStefano Zampini else psum = 0; 759057de7509SStefano Zampini ierr = MPIU_Allreduce(&psum,&ncoarse,1,MPIU_INT,MPI_SUM,PetscObjectComm((PetscObject)pc));CHKERRQ(ierr); 75917de4f681Sstefano_zampini if (ncoarse < commsize) have_void = PETSC_TRUE; 759257de7509SStefano Zampini } 759357de7509SStefano Zampini /* determine if we can go multilevel */ 759457de7509SStefano Zampini if (multilevel_requested) { 759557de7509SStefano Zampini if (ncoarse > 1) multilevel_allowed = PETSC_TRUE; /* found enough processes */ 759657de7509SStefano Zampini else restr = full_restr = PETSC_TRUE; /* 1 subdomain, use a direct solver */ 
759757de7509SStefano Zampini } 759857de7509SStefano Zampini if (multilevel_allowed && have_void) restr = PETSC_TRUE; 759957de7509SStefano Zampini 7600e4d548c7SStefano Zampini /* dump subassembling pattern */ 7601e4d548c7SStefano Zampini if (pcbddc->dbg_flag && multilevel_allowed) { 7602e4d548c7SStefano Zampini ierr = ISView(pcbddc->coarse_subassembling,pcbddc->dbg_viewer);CHKERRQ(ierr); 7603e4d548c7SStefano Zampini } 7604e4d548c7SStefano Zampini 76056e683305SStefano Zampini /* compute dofs splitting and neumann boundaries for coarse dofs */ 76061e0482f5SStefano Zampini nedcfield = -1; 76071e0482f5SStefano Zampini if (multilevel_allowed && !coarse_reuse && (pcbddc->n_ISForDofsLocal || pcbddc->NeumannBoundariesLocal || pcbddc->nedclocal)) { /* protects from unneded computations */ 76086e683305SStefano Zampini PetscInt *tidxs,*tidxs2,nout,tsize,i; 76096e683305SStefano Zampini const PetscInt *idxs; 76106e683305SStefano Zampini ISLocalToGlobalMapping tmap; 76116e683305SStefano Zampini 76126e683305SStefano Zampini /* create map between primal indices (in local representative ordering) and local primal numbering */ 76130be93d54SStefano Zampini ierr = ISLocalToGlobalMappingCreate(PETSC_COMM_SELF,1,pcbddc->local_primal_size,pcbddc->primal_indices_local_idxs,PETSC_COPY_VALUES,&tmap);CHKERRQ(ierr); 76146e683305SStefano Zampini /* allocate space for temporary storage */ 7615854ce69bSBarry Smith ierr = PetscMalloc1(pcbddc->local_primal_size,&tidxs);CHKERRQ(ierr); 7616854ce69bSBarry Smith ierr = PetscMalloc1(pcbddc->local_primal_size,&tidxs2);CHKERRQ(ierr); 76176e683305SStefano Zampini /* allocate for IS array */ 76186e683305SStefano Zampini nisdofs = pcbddc->n_ISForDofsLocal; 76191e0482f5SStefano Zampini if (pcbddc->nedclocal) { 76201e0482f5SStefano Zampini if (pcbddc->nedfield > -1) { 76211e0482f5SStefano Zampini nedcfield = pcbddc->nedfield; 76221e0482f5SStefano Zampini } else { 76231e0482f5SStefano Zampini nedcfield = 0; 76241e0482f5SStefano Zampini if (nisdofs) 
SETERRQ1(PetscObjectComm((PetscObject)pc),PETSC_ERR_PLIB,"This should not happen (%d)",nisdofs); 76251e0482f5SStefano Zampini nisdofs = 1; 76261e0482f5SStefano Zampini } 76271e0482f5SStefano Zampini } 76286e683305SStefano Zampini nisneu = !!pcbddc->NeumannBoundariesLocal; 762927b6a85dSStefano Zampini nisvert = 0; /* nisvert is not used */ 763030368db7SStefano Zampini nis = nisdofs + nisneu + nisvert; 7631854ce69bSBarry Smith ierr = PetscMalloc1(nis,&isarray);CHKERRQ(ierr); 76326e683305SStefano Zampini /* dofs splitting */ 76336e683305SStefano Zampini for (i=0;i<nisdofs;i++) { 76346e683305SStefano Zampini /* ierr = ISView(pcbddc->ISForDofsLocal[i],0);CHKERRQ(ierr); */ 76351e0482f5SStefano Zampini if (nedcfield != i) { 76366e683305SStefano Zampini ierr = ISGetLocalSize(pcbddc->ISForDofsLocal[i],&tsize);CHKERRQ(ierr); 76376e683305SStefano Zampini ierr = ISGetIndices(pcbddc->ISForDofsLocal[i],&idxs);CHKERRQ(ierr); 76386e683305SStefano Zampini ierr = ISGlobalToLocalMappingApply(tmap,IS_GTOLM_DROP,tsize,idxs,&nout,tidxs);CHKERRQ(ierr); 76396e683305SStefano Zampini ierr = ISRestoreIndices(pcbddc->ISForDofsLocal[i],&idxs);CHKERRQ(ierr); 76401e0482f5SStefano Zampini } else { 76411e0482f5SStefano Zampini ierr = ISGetLocalSize(pcbddc->nedclocal,&tsize);CHKERRQ(ierr); 76421e0482f5SStefano Zampini ierr = ISGetIndices(pcbddc->nedclocal,&idxs);CHKERRQ(ierr); 76431e0482f5SStefano Zampini ierr = ISGlobalToLocalMappingApply(tmap,IS_GTOLM_DROP,tsize,idxs,&nout,tidxs);CHKERRQ(ierr); 7644eee23b56SStefano Zampini if (tsize != nout) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Failed when mapping coarse nedelec field! 
%d != %d\n",tsize,nout); 76451e0482f5SStefano Zampini ierr = ISRestoreIndices(pcbddc->nedclocal,&idxs);CHKERRQ(ierr); 76461e0482f5SStefano Zampini } 76476e683305SStefano Zampini ierr = ISLocalToGlobalMappingApply(coarse_islg,nout,tidxs,tidxs2);CHKERRQ(ierr); 764830368db7SStefano Zampini ierr = ISCreateGeneral(PetscObjectComm((PetscObject)pc),nout,tidxs2,PETSC_COPY_VALUES,&isarray[i]);CHKERRQ(ierr); 76496e683305SStefano Zampini /* ierr = ISView(isarray[i],0);CHKERRQ(ierr); */ 76506e683305SStefano Zampini } 76516e683305SStefano Zampini /* neumann boundaries */ 76526e683305SStefano Zampini if (pcbddc->NeumannBoundariesLocal) { 76536e683305SStefano Zampini /* ierr = ISView(pcbddc->NeumannBoundariesLocal,0);CHKERRQ(ierr); */ 76546e683305SStefano Zampini ierr = ISGetLocalSize(pcbddc->NeumannBoundariesLocal,&tsize);CHKERRQ(ierr); 76556e683305SStefano Zampini ierr = ISGetIndices(pcbddc->NeumannBoundariesLocal,&idxs);CHKERRQ(ierr); 76566e683305SStefano Zampini ierr = ISGlobalToLocalMappingApply(tmap,IS_GTOLM_DROP,tsize,idxs,&nout,tidxs);CHKERRQ(ierr); 76576e683305SStefano Zampini ierr = ISRestoreIndices(pcbddc->NeumannBoundariesLocal,&idxs);CHKERRQ(ierr); 76586e683305SStefano Zampini ierr = ISLocalToGlobalMappingApply(coarse_islg,nout,tidxs,tidxs2);CHKERRQ(ierr); 765930368db7SStefano Zampini ierr = ISCreateGeneral(PetscObjectComm((PetscObject)pc),nout,tidxs2,PETSC_COPY_VALUES,&isarray[nisdofs]);CHKERRQ(ierr); 76606e683305SStefano Zampini /* ierr = ISView(isarray[nisdofs],0);CHKERRQ(ierr); */ 76616e683305SStefano Zampini } 76626e683305SStefano Zampini /* free memory */ 76636e683305SStefano Zampini ierr = PetscFree(tidxs);CHKERRQ(ierr); 76646e683305SStefano Zampini ierr = PetscFree(tidxs2);CHKERRQ(ierr); 76656e683305SStefano Zampini ierr = ISLocalToGlobalMappingDestroy(&tmap);CHKERRQ(ierr); 76666e683305SStefano Zampini } else { 76676e683305SStefano Zampini nis = 0; 76686e683305SStefano Zampini nisdofs = 0; 76696e683305SStefano Zampini nisneu = 0; 767030368db7SStefano Zampini 
nisvert = 0; 76716e683305SStefano Zampini isarray = NULL; 76726e683305SStefano Zampini } 76736e683305SStefano Zampini /* destroy no longer needed map */ 76746e683305SStefano Zampini ierr = ISLocalToGlobalMappingDestroy(&coarse_islg);CHKERRQ(ierr); 76756e683305SStefano Zampini 767657de7509SStefano Zampini /* subassemble */ 767757de7509SStefano Zampini if (multilevel_allowed) { 76781ae86dd6SStefano Zampini Vec vp[1]; 76791ae86dd6SStefano Zampini PetscInt nvecs = 0; 768057de7509SStefano Zampini PetscBool reuse,reuser; 76811ae86dd6SStefano Zampini 768257de7509SStefano Zampini if (coarse_mat) reuse = PETSC_TRUE; 768357de7509SStefano Zampini else reuse = PETSC_FALSE; 768457de7509SStefano Zampini ierr = MPIU_Allreduce(&reuse,&reuser,1,MPIU_BOOL,MPI_LOR,PetscObjectComm((PetscObject)pc));CHKERRQ(ierr); 76851ae86dd6SStefano Zampini vp[0] = NULL; 76861ae86dd6SStefano Zampini if (pcbddc->benign_have_null) { /* propagate no-net-flux quadrature to coarser level */ 76871ae86dd6SStefano Zampini ierr = VecCreate(PetscObjectComm((PetscObject)pc),&vp[0]);CHKERRQ(ierr); 76881ae86dd6SStefano Zampini ierr = VecSetSizes(vp[0],pcbddc->local_primal_size,PETSC_DECIDE);CHKERRQ(ierr); 76891ae86dd6SStefano Zampini ierr = VecSetType(vp[0],VECSTANDARD);CHKERRQ(ierr); 76901ae86dd6SStefano Zampini nvecs = 1; 76911ae86dd6SStefano Zampini 76921ae86dd6SStefano Zampini if (pcbddc->divudotp) { 7693a198735bSStefano Zampini Mat B,loc_divudotp; 76941ae86dd6SStefano Zampini Vec v,p; 76951ae86dd6SStefano Zampini IS dummy; 76961ae86dd6SStefano Zampini PetscInt np; 76971ae86dd6SStefano Zampini 7698a198735bSStefano Zampini ierr = MatISGetLocalMat(pcbddc->divudotp,&loc_divudotp);CHKERRQ(ierr); 7699a198735bSStefano Zampini ierr = MatGetSize(loc_divudotp,&np,NULL);CHKERRQ(ierr); 77001ae86dd6SStefano Zampini ierr = ISCreateStride(PETSC_COMM_SELF,np,0,1,&dummy);CHKERRQ(ierr); 77017dae84e0SHong Zhang ierr = MatCreateSubMatrix(loc_divudotp,dummy,pcis->is_B_local,MAT_INITIAL_MATRIX,&B);CHKERRQ(ierr); 
77021ae86dd6SStefano Zampini ierr = MatCreateVecs(B,&v,&p);CHKERRQ(ierr); 77031ae86dd6SStefano Zampini ierr = VecSet(p,1.);CHKERRQ(ierr); 77041ae86dd6SStefano Zampini ierr = MatMultTranspose(B,p,v);CHKERRQ(ierr); 77051ae86dd6SStefano Zampini ierr = VecDestroy(&p);CHKERRQ(ierr); 77061ae86dd6SStefano Zampini ierr = MatDestroy(&B);CHKERRQ(ierr); 77071ae86dd6SStefano Zampini ierr = VecGetArray(vp[0],&array);CHKERRQ(ierr); 77081ae86dd6SStefano Zampini ierr = VecPlaceArray(pcbddc->vec1_P,array);CHKERRQ(ierr); 77091ae86dd6SStefano Zampini ierr = VecRestoreArray(vp[0],&array);CHKERRQ(ierr); 77101ae86dd6SStefano Zampini ierr = MatMultTranspose(pcbddc->coarse_phi_B,v,pcbddc->vec1_P);CHKERRQ(ierr); 77111ae86dd6SStefano Zampini ierr = VecResetArray(pcbddc->vec1_P);CHKERRQ(ierr); 77121ae86dd6SStefano Zampini ierr = ISDestroy(&dummy);CHKERRQ(ierr); 77131ae86dd6SStefano Zampini ierr = VecDestroy(&v);CHKERRQ(ierr); 771474e2c79eSStefano Zampini } 77151ae86dd6SStefano Zampini } 77161ae86dd6SStefano Zampini if (reuser) { 77171e0482f5SStefano Zampini ierr = PCBDDCMatISSubassemble(t_coarse_mat_is,pcbddc->coarse_subassembling,0,restr,full_restr,PETSC_TRUE,&coarse_mat,nis,isarray,nvecs,vp);CHKERRQ(ierr); 771874e2c79eSStefano Zampini } else { 77191e0482f5SStefano Zampini ierr = PCBDDCMatISSubassemble(t_coarse_mat_is,pcbddc->coarse_subassembling,0,restr,full_restr,PETSC_FALSE,&coarse_mat_is,nis,isarray,nvecs,vp);CHKERRQ(ierr); 77201ae86dd6SStefano Zampini } 77211ae86dd6SStefano Zampini if (vp[0]) { /* vp[0] could have been placed on a different set of processes */ 77221ae86dd6SStefano Zampini PetscScalar *arraym,*arrayv; 77231ae86dd6SStefano Zampini PetscInt nl; 77241ae86dd6SStefano Zampini ierr = VecGetLocalSize(vp[0],&nl);CHKERRQ(ierr); 77251ae86dd6SStefano Zampini ierr = MatCreateSeqDense(PETSC_COMM_SELF,1,nl,NULL,&coarsedivudotp);CHKERRQ(ierr); 77261ae86dd6SStefano Zampini ierr = MatDenseGetArray(coarsedivudotp,&arraym);CHKERRQ(ierr); 77271ae86dd6SStefano Zampini ierr = 
VecGetArray(vp[0],&arrayv);CHKERRQ(ierr); 77281ae86dd6SStefano Zampini ierr = PetscMemcpy(arraym,arrayv,nl*sizeof(PetscScalar));CHKERRQ(ierr); 77291ae86dd6SStefano Zampini ierr = VecRestoreArray(vp[0],&arrayv);CHKERRQ(ierr); 77301ae86dd6SStefano Zampini ierr = MatDenseRestoreArray(coarsedivudotp,&arraym);CHKERRQ(ierr); 77311ae86dd6SStefano Zampini ierr = VecDestroy(&vp[0]);CHKERRQ(ierr); 7732a198735bSStefano Zampini } else { 7733a198735bSStefano Zampini ierr = MatCreateSeqAIJ(PETSC_COMM_SELF,0,0,1,NULL,&coarsedivudotp);CHKERRQ(ierr); 77341ae86dd6SStefano Zampini } 77351ae86dd6SStefano Zampini } else { 77361e0482f5SStefano Zampini ierr = PCBDDCMatISSubassemble(t_coarse_mat_is,pcbddc->coarse_subassembling,0,restr,full_restr,PETSC_FALSE,&coarse_mat_is,0,NULL,0,NULL);CHKERRQ(ierr); 77376e683305SStefano Zampini } 773857de7509SStefano Zampini if (coarse_mat_is || coarse_mat) { 773957de7509SStefano Zampini PetscMPIInt size; 7740f913dca9SStefano Zampini ierr = MPI_Comm_size(PetscObjectComm((PetscObject)coarse_mat_is),&size);CHKERRQ(ierr); 774157de7509SStefano Zampini if (!multilevel_allowed) { 774257de7509SStefano Zampini ierr = MatISGetMPIXAIJ(coarse_mat_is,coarse_mat_reuse,&coarse_mat);CHKERRQ(ierr); 77436e683305SStefano Zampini } else { 774457de7509SStefano Zampini Mat A; 7745779c1cceSStefano Zampini 774657de7509SStefano Zampini /* if this matrix is present, it means we are not reusing the coarse matrix */ 774757de7509SStefano Zampini if (coarse_mat_is) { 774857de7509SStefano Zampini if (coarse_mat) SETERRQ(PetscObjectComm((PetscObject)coarse_mat_is),PETSC_ERR_PLIB,"This should not happen"); 774957de7509SStefano Zampini ierr = PetscObjectReference((PetscObject)coarse_mat_is);CHKERRQ(ierr); 775057de7509SStefano Zampini coarse_mat = coarse_mat_is; 775157de7509SStefano Zampini } 775257de7509SStefano Zampini /* be sure we don't have MatSeqDENSE as local mat */ 775357de7509SStefano Zampini ierr = MatISGetLocalMat(coarse_mat,&A);CHKERRQ(ierr); 775457de7509SStefano Zampini 
ierr = MatConvert(A,MATSEQAIJ,MAT_INPLACE_MATRIX,&A);CHKERRQ(ierr); 7755779c1cceSStefano Zampini } 7756779c1cceSStefano Zampini } 775757de7509SStefano Zampini ierr = MatDestroy(&t_coarse_mat_is);CHKERRQ(ierr); 775857de7509SStefano Zampini ierr = MatDestroy(&coarse_mat_is);CHKERRQ(ierr); 77596e683305SStefano Zampini 77606e683305SStefano Zampini /* create local to global scatters for coarse problem */ 776168457ee5SStefano Zampini if (compute_vecs) { 77626e683305SStefano Zampini PetscInt lrows; 77636e683305SStefano Zampini ierr = VecDestroy(&pcbddc->coarse_vec);CHKERRQ(ierr); 776457de7509SStefano Zampini if (coarse_mat) { 776557de7509SStefano Zampini ierr = MatGetLocalSize(coarse_mat,&lrows,NULL);CHKERRQ(ierr); 77666e683305SStefano Zampini } else { 77676e683305SStefano Zampini lrows = 0; 77686e683305SStefano Zampini } 77696e683305SStefano Zampini ierr = VecCreate(PetscObjectComm((PetscObject)pc),&pcbddc->coarse_vec);CHKERRQ(ierr); 77706e683305SStefano Zampini ierr = VecSetSizes(pcbddc->coarse_vec,lrows,PETSC_DECIDE);CHKERRQ(ierr); 77716e683305SStefano Zampini ierr = VecSetType(pcbddc->coarse_vec,VECSTANDARD);CHKERRQ(ierr); 77726e683305SStefano Zampini ierr = VecScatterDestroy(&pcbddc->coarse_loc_to_glob);CHKERRQ(ierr); 77736e683305SStefano Zampini ierr = VecScatterCreate(pcbddc->vec1_P,NULL,pcbddc->coarse_vec,coarse_is,&pcbddc->coarse_loc_to_glob);CHKERRQ(ierr); 77746e683305SStefano Zampini } 77756e683305SStefano Zampini ierr = ISDestroy(&coarse_is);CHKERRQ(ierr); 7776c8587f34SStefano Zampini 7777f9eb5b7dSStefano Zampini /* set defaults for coarse KSP and PC */ 7778f9eb5b7dSStefano Zampini if (multilevel_allowed) { 7779f9eb5b7dSStefano Zampini coarse_ksp_type = KSPRICHARDSON; 7780f9eb5b7dSStefano Zampini coarse_pc_type = PCBDDC; 7781f9eb5b7dSStefano Zampini } else { 7782f9eb5b7dSStefano Zampini coarse_ksp_type = KSPPREONLY; 7783f9eb5b7dSStefano Zampini coarse_pc_type = PCREDUNDANT; 7784c8587f34SStefano Zampini } 7785c8587f34SStefano Zampini 77866e683305SStefano 
Zampini /* print some info if requested */ 77876e683305SStefano Zampini if (pcbddc->dbg_flag) { 77886e683305SStefano Zampini if (!multilevel_allowed) { 77896e683305SStefano Zampini ierr = PetscViewerASCIIPrintf(pcbddc->dbg_viewer,"--------------------------------------------------\n");CHKERRQ(ierr); 77906e683305SStefano Zampini if (multilevel_requested) { 77916e683305SStefano Zampini ierr = PetscViewerASCIIPrintf(pcbddc->dbg_viewer,"Not enough active processes on level %d (active processes %d, coarsening ratio %d)\n",pcbddc->current_level,active_procs,pcbddc->coarsening_ratio);CHKERRQ(ierr); 77926e683305SStefano Zampini } else if (pcbddc->max_levels) { 77936e683305SStefano Zampini ierr = PetscViewerASCIIPrintf(pcbddc->dbg_viewer,"Maximum number of requested levels reached (%d)\n",pcbddc->max_levels);CHKERRQ(ierr); 77946e683305SStefano Zampini } 77956e683305SStefano Zampini ierr = PetscViewerFlush(pcbddc->dbg_viewer);CHKERRQ(ierr); 77966e683305SStefano Zampini } 77976e683305SStefano Zampini } 77986e683305SStefano Zampini 77991e0482f5SStefano Zampini /* communicate coarse discrete gradient */ 78001e0482f5SStefano Zampini coarseG = NULL; 78011e0482f5SStefano Zampini if (pcbddc->nedcG && multilevel_allowed) { 78021e0482f5SStefano Zampini MPI_Comm ccomm; 78031e0482f5SStefano Zampini if (coarse_mat) { 78041e0482f5SStefano Zampini ccomm = PetscObjectComm((PetscObject)coarse_mat); 78051e0482f5SStefano Zampini } else { 78061e0482f5SStefano Zampini ccomm = MPI_COMM_NULL; 78071e0482f5SStefano Zampini } 78081e0482f5SStefano Zampini ierr = MatMPIAIJRestrict(pcbddc->nedcG,ccomm,&coarseG);CHKERRQ(ierr); 78091e0482f5SStefano Zampini } 78101e0482f5SStefano Zampini 7811f9eb5b7dSStefano Zampini /* create the coarse KSP object only once with defaults */ 781257de7509SStefano Zampini if (coarse_mat) { 78136a1308c2SStefano Zampini PetscViewer dbg_viewer = NULL; 78146e683305SStefano Zampini if (pcbddc->dbg_flag) { 781557de7509SStefano Zampini dbg_viewer = 
PETSC_VIEWER_STDOUT_(PetscObjectComm((PetscObject)coarse_mat)); 78166e683305SStefano Zampini ierr = PetscViewerASCIIAddTab(dbg_viewer,2*pcbddc->current_level);CHKERRQ(ierr); 78176e683305SStefano Zampini } 7818f9eb5b7dSStefano Zampini if (!pcbddc->coarse_ksp) { 7819312be037SStefano Zampini char prefix[256],str_level[16]; 7820e604994aSStefano Zampini size_t len; 78211e0482f5SStefano Zampini 782257de7509SStefano Zampini ierr = KSPCreate(PetscObjectComm((PetscObject)coarse_mat),&pcbddc->coarse_ksp);CHKERRQ(ierr); 7823422a814eSBarry Smith ierr = KSPSetErrorIfNotConverged(pcbddc->coarse_ksp,pc->erroriffailure);CHKERRQ(ierr); 7824c8587f34SStefano Zampini ierr = PetscObjectIncrementTabLevel((PetscObject)pcbddc->coarse_ksp,(PetscObject)pc,1);CHKERRQ(ierr); 7825f9eb5b7dSStefano Zampini ierr = KSPSetTolerances(pcbddc->coarse_ksp,PETSC_DEFAULT,PETSC_DEFAULT,PETSC_DEFAULT,1);CHKERRQ(ierr); 782657de7509SStefano Zampini ierr = KSPSetOperators(pcbddc->coarse_ksp,coarse_mat,coarse_mat);CHKERRQ(ierr); 7827c8587f34SStefano Zampini ierr = KSPSetType(pcbddc->coarse_ksp,coarse_ksp_type);CHKERRQ(ierr); 78286e683305SStefano Zampini ierr = KSPSetNormType(pcbddc->coarse_ksp,KSP_NORM_NONE);CHKERRQ(ierr); 7829c8587f34SStefano Zampini ierr = KSPGetPC(pcbddc->coarse_ksp,&pc_temp);CHKERRQ(ierr); 78301e0482f5SStefano Zampini /* TODO is this logic correct? 
should check for coarse_mat type */ 7831c8587f34SStefano Zampini ierr = PCSetType(pc_temp,coarse_pc_type);CHKERRQ(ierr); 7832e604994aSStefano Zampini /* prefix */ 7833e604994aSStefano Zampini ierr = PetscStrcpy(prefix,"");CHKERRQ(ierr); 7834e604994aSStefano Zampini ierr = PetscStrcpy(str_level,"");CHKERRQ(ierr); 7835e604994aSStefano Zampini if (!pcbddc->current_level) { 7836e604994aSStefano Zampini ierr = PetscStrcpy(prefix,((PetscObject)pc)->prefix);CHKERRQ(ierr); 7837e604994aSStefano Zampini ierr = PetscStrcat(prefix,"pc_bddc_coarse_");CHKERRQ(ierr); 7838c8587f34SStefano Zampini } else { 7839e604994aSStefano Zampini ierr = PetscStrlen(((PetscObject)pc)->prefix,&len);CHKERRQ(ierr); 7840312be037SStefano Zampini if (pcbddc->current_level>1) len -= 3; /* remove "lX_" with X level number */ 7841312be037SStefano Zampini if (pcbddc->current_level>10) len -= 1; /* remove another char from level number */ 784234d6797cSStefano Zampini ierr = PetscStrncpy(prefix,((PetscObject)pc)->prefix,len+1);CHKERRQ(ierr); 7843312be037SStefano Zampini sprintf(str_level,"l%d_",(int)(pcbddc->current_level)); 7844e604994aSStefano Zampini ierr = PetscStrcat(prefix,str_level);CHKERRQ(ierr); 7845e604994aSStefano Zampini } 7846e604994aSStefano Zampini ierr = KSPSetOptionsPrefix(pcbddc->coarse_ksp,prefix);CHKERRQ(ierr); 78473e3c6dadSStefano Zampini /* propagate BDDC info to the next level (these are dummy calls if pc_temp is not of type PCBDDC) */ 78483e3c6dadSStefano Zampini ierr = PCBDDCSetLevel(pc_temp,pcbddc->current_level+1);CHKERRQ(ierr); 78493e3c6dadSStefano Zampini ierr = PCBDDCSetCoarseningRatio(pc_temp,pcbddc->coarsening_ratio);CHKERRQ(ierr); 78503e3c6dadSStefano Zampini ierr = PCBDDCSetLevels(pc_temp,pcbddc->max_levels);CHKERRQ(ierr); 7851f9eb5b7dSStefano Zampini /* allow user customization */ 7852f9eb5b7dSStefano Zampini ierr = KSPSetFromOptions(pcbddc->coarse_ksp);CHKERRQ(ierr); 78533e3c6dadSStefano Zampini } 78543e3c6dadSStefano Zampini /* propagate BDDC info to the next level 
(these are dummy calls if pc_temp is not of type PCBDDC) */ 785551bea450SStefano Zampini ierr = KSPGetPC(pcbddc->coarse_ksp,&pc_temp);CHKERRQ(ierr); 78563e3c6dadSStefano Zampini if (nisdofs) { 78573e3c6dadSStefano Zampini ierr = PCBDDCSetDofsSplitting(pc_temp,nisdofs,isarray);CHKERRQ(ierr); 78583e3c6dadSStefano Zampini for (i=0;i<nisdofs;i++) { 78593e3c6dadSStefano Zampini ierr = ISDestroy(&isarray[i]);CHKERRQ(ierr); 78603e3c6dadSStefano Zampini } 78613e3c6dadSStefano Zampini } 78623e3c6dadSStefano Zampini if (nisneu) { 78633e3c6dadSStefano Zampini ierr = PCBDDCSetNeumannBoundaries(pc_temp,isarray[nisdofs]);CHKERRQ(ierr); 78643e3c6dadSStefano Zampini ierr = ISDestroy(&isarray[nisdofs]);CHKERRQ(ierr); 7865312be037SStefano Zampini } 786630368db7SStefano Zampini if (nisvert) { 786730368db7SStefano Zampini ierr = PCBDDCSetPrimalVerticesIS(pc_temp,isarray[nis-1]);CHKERRQ(ierr); 786830368db7SStefano Zampini ierr = ISDestroy(&isarray[nis-1]);CHKERRQ(ierr); 786930368db7SStefano Zampini } 78701e0482f5SStefano Zampini if (coarseG) { 78711e0482f5SStefano Zampini ierr = PCBDDCSetDiscreteGradient(pc_temp,coarseG,1,nedcfield,PETSC_FALSE,PETSC_TRUE);CHKERRQ(ierr); 78721e0482f5SStefano Zampini } 7873f9eb5b7dSStefano Zampini 7874f9eb5b7dSStefano Zampini /* get some info after set from options */ 7875f9eb5b7dSStefano Zampini ierr = PetscObjectTypeCompare((PetscObject)pc_temp,PCNN,&isnn);CHKERRQ(ierr); 7876f9eb5b7dSStefano Zampini ierr = PetscObjectTypeCompare((PetscObject)pc_temp,PCBDDC,&isbddc);CHKERRQ(ierr); 78774f3a063dSStefano Zampini ierr = PetscObjectTypeCompare((PetscObject)pc_temp,PCREDUNDANT,&isredundant);CHKERRQ(ierr); 7878b76f3995Sstefano_zampini /* multilevel can only be requested via -pc_bddc_levels or PCBDDCSetLevels */ 7879b76f3995Sstefano_zampini if (isbddc && !multilevel_allowed) { 7880f9eb5b7dSStefano Zampini ierr = PCSetType(pc_temp,coarse_pc_type);CHKERRQ(ierr); 7881f9eb5b7dSStefano Zampini isbddc = PETSC_FALSE; 7882f9eb5b7dSStefano Zampini } 
7883b76f3995Sstefano_zampini /* multilevel cannot be done with coarse PCs different from BDDC or NN */ 7884b76f3995Sstefano_zampini if (multilevel_requested && !isbddc && !isnn) { 7885b76f3995Sstefano_zampini ierr = PCSetType(pc_temp,PCBDDC);CHKERRQ(ierr); 7886b76f3995Sstefano_zampini isbddc = PETSC_TRUE; 7887b76f3995Sstefano_zampini isnn = PETSC_FALSE; 7888b76f3995Sstefano_zampini } 788939f0f02cSStefano Zampini ierr = PCFactorSetReuseFill(pc_temp,PETSC_TRUE);CHKERRQ(ierr); 78904f3a063dSStefano Zampini if (isredundant) { 78914f3a063dSStefano Zampini KSP inner_ksp; 78924f3a063dSStefano Zampini PC inner_pc; 78939326c5c6Sstefano_zampini 78944f3a063dSStefano Zampini ierr = PCRedundantGetKSP(pc_temp,&inner_ksp);CHKERRQ(ierr); 78954f3a063dSStefano Zampini ierr = KSPGetPC(inner_ksp,&inner_pc);CHKERRQ(ierr); 78964f3a063dSStefano Zampini ierr = PCFactorSetReuseFill(inner_pc,PETSC_TRUE);CHKERRQ(ierr); 78974f3a063dSStefano Zampini } 7898f9eb5b7dSStefano Zampini 789957de7509SStefano Zampini /* parameters which miss an API */ 790057de7509SStefano Zampini if (isbddc) { 7901720d30f9SStefano Zampini PC_BDDC* pcbddc_coarse = (PC_BDDC*)pc_temp->data; 7902720d30f9SStefano Zampini pcbddc_coarse->detect_disconnected = PETSC_TRUE; 790357de7509SStefano Zampini pcbddc_coarse->coarse_eqs_per_proc = pcbddc->coarse_eqs_per_proc; 790427b6a85dSStefano Zampini pcbddc_coarse->benign_saddle_point = pcbddc->benign_have_null; 790527b6a85dSStefano Zampini if (pcbddc_coarse->benign_saddle_point) { 7906a198735bSStefano Zampini Mat coarsedivudotp_is; 7907a198735bSStefano Zampini ISLocalToGlobalMapping l2gmap,rl2g,cl2g; 7908a198735bSStefano Zampini IS row,col; 7909a198735bSStefano Zampini const PetscInt *gidxs; 7910a198735bSStefano Zampini PetscInt n,st,M,N; 7911a198735bSStefano Zampini 7912a198735bSStefano Zampini ierr = MatGetSize(coarsedivudotp,&n,NULL);CHKERRQ(ierr); 7913a198735bSStefano Zampini ierr = MPI_Scan(&n,&st,1,MPIU_INT,MPI_SUM,PetscObjectComm((PetscObject)coarse_mat));CHKERRQ(ierr); 
7914a198735bSStefano Zampini st = st-n; 7915a198735bSStefano Zampini ierr = ISCreateStride(PetscObjectComm((PetscObject)coarse_mat),1,st,1,&row);CHKERRQ(ierr); 7916a198735bSStefano Zampini ierr = MatGetLocalToGlobalMapping(coarse_mat,&l2gmap,NULL);CHKERRQ(ierr); 7917a198735bSStefano Zampini ierr = ISLocalToGlobalMappingGetSize(l2gmap,&n);CHKERRQ(ierr); 7918a198735bSStefano Zampini ierr = ISLocalToGlobalMappingGetIndices(l2gmap,&gidxs);CHKERRQ(ierr); 7919a198735bSStefano Zampini ierr = ISCreateGeneral(PetscObjectComm((PetscObject)coarse_mat),n,gidxs,PETSC_COPY_VALUES,&col);CHKERRQ(ierr); 7920a198735bSStefano Zampini ierr = ISLocalToGlobalMappingRestoreIndices(l2gmap,&gidxs);CHKERRQ(ierr); 7921a198735bSStefano Zampini ierr = ISLocalToGlobalMappingCreateIS(row,&rl2g);CHKERRQ(ierr); 7922a198735bSStefano Zampini ierr = ISLocalToGlobalMappingCreateIS(col,&cl2g);CHKERRQ(ierr); 7923a198735bSStefano Zampini ierr = ISGetSize(row,&M);CHKERRQ(ierr); 7924a198735bSStefano Zampini ierr = MatGetSize(coarse_mat,&N,NULL);CHKERRQ(ierr); 7925a198735bSStefano Zampini ierr = ISDestroy(&row);CHKERRQ(ierr); 7926a198735bSStefano Zampini ierr = ISDestroy(&col);CHKERRQ(ierr); 7927a198735bSStefano Zampini ierr = MatCreate(PetscObjectComm((PetscObject)coarse_mat),&coarsedivudotp_is);CHKERRQ(ierr); 7928a198735bSStefano Zampini ierr = MatSetType(coarsedivudotp_is,MATIS);CHKERRQ(ierr); 7929a198735bSStefano Zampini ierr = MatSetSizes(coarsedivudotp_is,PETSC_DECIDE,PETSC_DECIDE,M,N);CHKERRQ(ierr); 7930a198735bSStefano Zampini ierr = MatSetLocalToGlobalMapping(coarsedivudotp_is,rl2g,cl2g);CHKERRQ(ierr); 7931a198735bSStefano Zampini ierr = ISLocalToGlobalMappingDestroy(&rl2g);CHKERRQ(ierr); 7932a198735bSStefano Zampini ierr = ISLocalToGlobalMappingDestroy(&cl2g);CHKERRQ(ierr); 7933a198735bSStefano Zampini ierr = MatISSetLocalMat(coarsedivudotp_is,coarsedivudotp);CHKERRQ(ierr); 7934a198735bSStefano Zampini ierr = MatDestroy(&coarsedivudotp);CHKERRQ(ierr); 79358ae0ca82SStefano Zampini ierr = 
PCBDDCSetDivergenceMat(pc_temp,coarsedivudotp_is,PETSC_FALSE,NULL);CHKERRQ(ierr); 7936a198735bSStefano Zampini ierr = MatDestroy(&coarsedivudotp_is);CHKERRQ(ierr); 7937720d30f9SStefano Zampini pcbddc_coarse->adaptive_userdefined = PETSC_TRUE; 793859e48ca4SStefano Zampini if (pcbddc->adaptive_threshold < 1.0) pcbddc_coarse->deluxe_zerorows = PETSC_TRUE; 7939720d30f9SStefano Zampini } 7940d4d8cf7bSStefano Zampini } 79419881197aSStefano Zampini 79423301b35fSStefano Zampini /* propagate symmetry info of coarse matrix */ 79435a16e3a0SStefano Zampini ierr = MatSetOption(coarse_mat,MAT_STRUCTURALLY_SYMMETRIC,PETSC_TRUE);CHKERRQ(ierr); 79443301b35fSStefano Zampini if (pc->pmat->symmetric_set) { 79453301b35fSStefano Zampini ierr = MatSetOption(coarse_mat,MAT_SYMMETRIC,pc->pmat->symmetric);CHKERRQ(ierr); 79463301b35fSStefano Zampini } 79473301b35fSStefano Zampini if (pc->pmat->hermitian_set) { 79483301b35fSStefano Zampini ierr = MatSetOption(coarse_mat,MAT_HERMITIAN,pc->pmat->hermitian);CHKERRQ(ierr); 79493301b35fSStefano Zampini } 79503301b35fSStefano Zampini if (pc->pmat->spd_set) { 79513301b35fSStefano Zampini ierr = MatSetOption(coarse_mat,MAT_SPD,pc->pmat->spd);CHKERRQ(ierr); 79523301b35fSStefano Zampini } 795327b6a85dSStefano Zampini if (pcbddc->benign_saddle_point && !pcbddc->benign_have_null) { 795427b6a85dSStefano Zampini ierr = MatSetOption(coarse_mat,MAT_SPD,PETSC_TRUE);CHKERRQ(ierr); 795527b6a85dSStefano Zampini } 79566e683305SStefano Zampini /* set operators */ 79575f76c7aeSStefano Zampini ierr = KSPSetOperators(pcbddc->coarse_ksp,coarse_mat,coarse_mat);CHKERRQ(ierr); 79586e683305SStefano Zampini if (pcbddc->dbg_flag) { 79596e683305SStefano Zampini ierr = PetscViewerASCIISubtractTab(dbg_viewer,2*pcbddc->current_level);CHKERRQ(ierr); 79606e683305SStefano Zampini } 79616e683305SStefano Zampini } 79621e0482f5SStefano Zampini ierr = MatDestroy(&coarseG);CHKERRQ(ierr); 79636e683305SStefano Zampini ierr = PetscFree(isarray);CHKERRQ(ierr); 7964b1ecc7b1SStefano Zampini 
#if 0 7965b9b85e73SStefano Zampini { 7966b9b85e73SStefano Zampini PetscViewer viewer; 7967b9b85e73SStefano Zampini char filename[256]; 7968b1ecc7b1SStefano Zampini sprintf(filename,"coarse_mat_level%d.m",pcbddc->current_level); 7969b1ecc7b1SStefano Zampini ierr = PetscViewerASCIIOpen(PetscObjectComm((PetscObject)coarse_mat),filename,&viewer);CHKERRQ(ierr); 79706a9046bcSBarry Smith ierr = PetscViewerPushFormat(viewer,PETSC_VIEWER_ASCII_MATLAB);CHKERRQ(ierr); 7971b9b85e73SStefano Zampini ierr = MatView(coarse_mat,viewer);CHKERRQ(ierr); 7972f159cad9SBarry Smith ierr = PetscViewerPopFormat(viewer);CHKERRQ(ierr); 7973b9b85e73SStefano Zampini ierr = PetscViewerDestroy(&viewer);CHKERRQ(ierr); 7974b9b85e73SStefano Zampini } 7975b9b85e73SStefano Zampini #endif 7976f9eb5b7dSStefano Zampini 797798a51de6SStefano Zampini if (pcbddc->coarse_ksp) { 797898a51de6SStefano Zampini Vec crhs,csol; 797904708bb6SStefano Zampini 7980f347579bSStefano Zampini ierr = KSPGetSolution(pcbddc->coarse_ksp,&csol);CHKERRQ(ierr); 7981f347579bSStefano Zampini ierr = KSPGetRhs(pcbddc->coarse_ksp,&crhs);CHKERRQ(ierr); 7982f347579bSStefano Zampini if (!csol) { 79832a7a6963SBarry Smith ierr = MatCreateVecs(coarse_mat,&((pcbddc->coarse_ksp)->vec_sol),NULL);CHKERRQ(ierr); 7984f9eb5b7dSStefano Zampini } 7985f347579bSStefano Zampini if (!crhs) { 79862a7a6963SBarry Smith ierr = MatCreateVecs(coarse_mat,NULL,&((pcbddc->coarse_ksp)->vec_rhs));CHKERRQ(ierr); 7987f347579bSStefano Zampini } 7988b0f5fe93SStefano Zampini } 79891ae86dd6SStefano Zampini ierr = MatDestroy(&coarsedivudotp);CHKERRQ(ierr); 7990b0f5fe93SStefano Zampini 7991b0f5fe93SStefano Zampini /* compute null space for coarse solver if the benign trick has been requested */ 7992b0f5fe93SStefano Zampini if (pcbddc->benign_null) { 7993b0f5fe93SStefano Zampini 7994b0f5fe93SStefano Zampini ierr = VecSet(pcbddc->vec1_P,0.);CHKERRQ(ierr); 79954f1b2e48SStefano Zampini for (i=0;i<pcbddc->benign_n;i++) { 79964f1b2e48SStefano Zampini ierr = 
VecSetValue(pcbddc->vec1_P,pcbddc->local_primal_size-pcbddc->benign_n+i,1.0,INSERT_VALUES);CHKERRQ(ierr); 79974f1b2e48SStefano Zampini } 7998b0f5fe93SStefano Zampini ierr = VecAssemblyBegin(pcbddc->vec1_P);CHKERRQ(ierr); 7999b0f5fe93SStefano Zampini ierr = VecAssemblyEnd(pcbddc->vec1_P);CHKERRQ(ierr); 8000b0f5fe93SStefano Zampini ierr = VecScatterBegin(pcbddc->coarse_loc_to_glob,pcbddc->vec1_P,pcbddc->coarse_vec,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 8001b0f5fe93SStefano Zampini ierr = VecScatterEnd(pcbddc->coarse_loc_to_glob,pcbddc->vec1_P,pcbddc->coarse_vec,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 8002b0f5fe93SStefano Zampini if (coarse_mat) { 8003b0f5fe93SStefano Zampini Vec nullv; 8004b0f5fe93SStefano Zampini PetscScalar *array,*array2; 8005b0f5fe93SStefano Zampini PetscInt nl; 8006b0f5fe93SStefano Zampini 8007b0f5fe93SStefano Zampini ierr = MatCreateVecs(coarse_mat,&nullv,NULL);CHKERRQ(ierr); 8008b0f5fe93SStefano Zampini ierr = VecGetLocalSize(nullv,&nl);CHKERRQ(ierr); 8009b0f5fe93SStefano Zampini ierr = VecGetArrayRead(pcbddc->coarse_vec,(const PetscScalar**)&array);CHKERRQ(ierr); 8010b0f5fe93SStefano Zampini ierr = VecGetArray(nullv,&array2);CHKERRQ(ierr); 8011b0f5fe93SStefano Zampini ierr = PetscMemcpy(array2,array,nl*sizeof(*array));CHKERRQ(ierr); 8012b0f5fe93SStefano Zampini ierr = VecRestoreArray(nullv,&array2);CHKERRQ(ierr); 8013b0f5fe93SStefano Zampini ierr = VecRestoreArrayRead(pcbddc->coarse_vec,(const PetscScalar**)&array);CHKERRQ(ierr); 8014b0f5fe93SStefano Zampini ierr = VecNormalize(nullv,NULL);CHKERRQ(ierr); 8015b0f5fe93SStefano Zampini ierr = MatNullSpaceCreate(PetscObjectComm((PetscObject)coarse_mat),PETSC_FALSE,1,&nullv,&CoarseNullSpace);CHKERRQ(ierr); 8016b0f5fe93SStefano Zampini ierr = VecDestroy(&nullv);CHKERRQ(ierr); 8017b0f5fe93SStefano Zampini } 8018b0f5fe93SStefano Zampini } 8019b0f5fe93SStefano Zampini 8020b0f5fe93SStefano Zampini if (pcbddc->coarse_ksp) { 8021b0f5fe93SStefano Zampini PetscBool ispreonly; 
8022b0f5fe93SStefano Zampini 8023b0f5fe93SStefano Zampini if (CoarseNullSpace) { 8024b0f5fe93SStefano Zampini PetscBool isnull; 8025b0f5fe93SStefano Zampini ierr = MatNullSpaceTest(CoarseNullSpace,coarse_mat,&isnull);CHKERRQ(ierr); 8026bef83e63SStefano Zampini if (isnull) { 8027b0f5fe93SStefano Zampini ierr = MatSetNullSpace(coarse_mat,CoarseNullSpace);CHKERRQ(ierr); 8028b0f5fe93SStefano Zampini } 8029bef83e63SStefano Zampini /* TODO: add local nullspaces (if any) */ 8030b0f5fe93SStefano Zampini } 8031b0f5fe93SStefano Zampini /* setup coarse ksp */ 8032b0f5fe93SStefano Zampini ierr = KSPSetUp(pcbddc->coarse_ksp);CHKERRQ(ierr); 8033cbcc2c2aSStefano Zampini /* Check coarse problem if in debug mode or if solving with an iterative method */ 8034cbcc2c2aSStefano Zampini ierr = PetscObjectTypeCompare((PetscObject)pcbddc->coarse_ksp,KSPPREONLY,&ispreonly);CHKERRQ(ierr); 80356e683305SStefano Zampini if (pcbddc->dbg_flag || (!ispreonly && pcbddc->use_coarse_estimates) ) { 8036c8587f34SStefano Zampini KSP check_ksp; 80372b510759SStefano Zampini KSPType check_ksp_type; 8038c8587f34SStefano Zampini PC check_pc; 80396e683305SStefano Zampini Vec check_vec,coarse_vec; 80406a1308c2SStefano Zampini PetscReal abs_infty_error,infty_error,lambda_min=1.0,lambda_max=1.0; 80412b510759SStefano Zampini PetscInt its; 80426e683305SStefano Zampini PetscBool compute_eigs; 80436e683305SStefano Zampini PetscReal *eigs_r,*eigs_c; 80446e683305SStefano Zampini PetscInt neigs; 80458e185a42SStefano Zampini const char *prefix; 8046c8587f34SStefano Zampini 80472b510759SStefano Zampini /* Create ksp object suitable for estimation of extreme eigenvalues */ 80486e683305SStefano Zampini ierr = KSPCreate(PetscObjectComm((PetscObject)pcbddc->coarse_ksp),&check_ksp);CHKERRQ(ierr); 8049422a814eSBarry Smith ierr = KSPSetErrorIfNotConverged(pcbddc->coarse_ksp,pc->erroriffailure);CHKERRQ(ierr); 805023ee1639SBarry Smith ierr = KSPSetOperators(check_ksp,coarse_mat,coarse_mat);CHKERRQ(ierr); 8051f4ddd8eeSStefano 
Zampini ierr = KSPSetTolerances(check_ksp,1.e-12,1.e-12,PETSC_DEFAULT,pcbddc->coarse_size);CHKERRQ(ierr); 8052e4d548c7SStefano Zampini /* prevent from setup unneeded object */ 8053e4d548c7SStefano Zampini ierr = KSPGetPC(check_ksp,&check_pc);CHKERRQ(ierr); 8054e4d548c7SStefano Zampini ierr = PCSetType(check_pc,PCNONE);CHKERRQ(ierr); 80552b510759SStefano Zampini if (ispreonly) { 80562b510759SStefano Zampini check_ksp_type = KSPPREONLY; 80576e683305SStefano Zampini compute_eigs = PETSC_FALSE; 80582b510759SStefano Zampini } else { 8059cbcc2c2aSStefano Zampini check_ksp_type = KSPGMRES; 80606e683305SStefano Zampini compute_eigs = PETSC_TRUE; 8061c8587f34SStefano Zampini } 8062c8587f34SStefano Zampini ierr = KSPSetType(check_ksp,check_ksp_type);CHKERRQ(ierr); 80636e683305SStefano Zampini ierr = KSPSetComputeSingularValues(check_ksp,compute_eigs);CHKERRQ(ierr); 80646e683305SStefano Zampini ierr = KSPSetComputeEigenvalues(check_ksp,compute_eigs);CHKERRQ(ierr); 80656e683305SStefano Zampini ierr = KSPGMRESSetRestart(check_ksp,pcbddc->coarse_size+1);CHKERRQ(ierr); 8066a7dc3881SStefano Zampini ierr = KSPGetOptionsPrefix(pcbddc->coarse_ksp,&prefix);CHKERRQ(ierr); 8067a7dc3881SStefano Zampini ierr = KSPSetOptionsPrefix(check_ksp,prefix);CHKERRQ(ierr); 8068a7dc3881SStefano Zampini ierr = KSPAppendOptionsPrefix(check_ksp,"check_");CHKERRQ(ierr); 8069a7dc3881SStefano Zampini ierr = KSPSetFromOptions(check_ksp);CHKERRQ(ierr); 8070c8587f34SStefano Zampini ierr = KSPSetUp(check_ksp);CHKERRQ(ierr); 8071c8587f34SStefano Zampini ierr = KSPGetPC(pcbddc->coarse_ksp,&check_pc);CHKERRQ(ierr); 8072c8587f34SStefano Zampini ierr = KSPSetPC(check_ksp,check_pc);CHKERRQ(ierr); 8073c8587f34SStefano Zampini /* create random vec */ 80742701bc32SStefano Zampini ierr = MatCreateVecs(coarse_mat,&coarse_vec,&check_vec);CHKERRQ(ierr); 8075c8587f34SStefano Zampini ierr = VecSetRandom(check_vec,NULL);CHKERRQ(ierr); 80766e683305SStefano Zampini ierr = MatMult(coarse_mat,check_vec,coarse_vec);CHKERRQ(ierr); 
8077c8587f34SStefano Zampini /* solve coarse problem */ 80786e683305SStefano Zampini ierr = KSPSolve(check_ksp,coarse_vec,coarse_vec);CHKERRQ(ierr); 8079cbcc2c2aSStefano Zampini /* set eigenvalue estimation if preonly has not been requested */ 80806e683305SStefano Zampini if (compute_eigs) { 8081854ce69bSBarry Smith ierr = PetscMalloc1(pcbddc->coarse_size+1,&eigs_r);CHKERRQ(ierr); 8082854ce69bSBarry Smith ierr = PetscMalloc1(pcbddc->coarse_size+1,&eigs_c);CHKERRQ(ierr); 80836e683305SStefano Zampini ierr = KSPComputeEigenvalues(check_ksp,pcbddc->coarse_size+1,eigs_r,eigs_c,&neigs);CHKERRQ(ierr); 80841ae86dd6SStefano Zampini if (neigs) { 80856e683305SStefano Zampini lambda_max = eigs_r[neigs-1]; 80866e683305SStefano Zampini lambda_min = eigs_r[0]; 80876e683305SStefano Zampini if (pcbddc->use_coarse_estimates) { 80882701bc32SStefano Zampini if (lambda_max>=lambda_min) { /* using PETSC_SMALL since lambda_max == lambda_min is not allowed by KSPChebyshevSetEigenvalues */ 80892701bc32SStefano Zampini ierr = KSPChebyshevSetEigenvalues(pcbddc->coarse_ksp,lambda_max+PETSC_SMALL,lambda_min);CHKERRQ(ierr); 8090cbcc2c2aSStefano Zampini ierr = KSPRichardsonSetScale(pcbddc->coarse_ksp,2.0/(lambda_max+lambda_min));CHKERRQ(ierr); 8091cbcc2c2aSStefano Zampini } 8092c8587f34SStefano Zampini } 8093c8587f34SStefano Zampini } 80941ae86dd6SStefano Zampini } 8095cbcc2c2aSStefano Zampini 8096c8587f34SStefano Zampini /* check coarse problem residual error */ 80976e683305SStefano Zampini if (pcbddc->dbg_flag) { 80986e683305SStefano Zampini PetscViewer dbg_viewer = PETSC_VIEWER_STDOUT_(PetscObjectComm((PetscObject)pcbddc->coarse_ksp)); 80996e683305SStefano Zampini ierr = PetscViewerASCIIAddTab(dbg_viewer,2*(pcbddc->current_level+1));CHKERRQ(ierr); 81006e683305SStefano Zampini ierr = VecAXPY(check_vec,-1.0,coarse_vec);CHKERRQ(ierr); 8101c8587f34SStefano Zampini ierr = VecNorm(check_vec,NORM_INFINITY,&infty_error);CHKERRQ(ierr); 81026e683305SStefano Zampini ierr = 
MatMult(coarse_mat,check_vec,coarse_vec);CHKERRQ(ierr); 81036e683305SStefano Zampini ierr = VecNorm(coarse_vec,NORM_INFINITY,&abs_infty_error);CHKERRQ(ierr); 8104779c1cceSStefano Zampini ierr = PetscViewerASCIIPrintf(dbg_viewer,"Coarse problem details (use estimates %d)\n",pcbddc->use_coarse_estimates);CHKERRQ(ierr); 81056e683305SStefano Zampini ierr = PetscObjectPrintClassNamePrefixType((PetscObject)(pcbddc->coarse_ksp),dbg_viewer);CHKERRQ(ierr); 81066e683305SStefano Zampini ierr = PetscObjectPrintClassNamePrefixType((PetscObject)(check_pc),dbg_viewer);CHKERRQ(ierr); 81076e683305SStefano Zampini ierr = PetscViewerASCIIPrintf(dbg_viewer,"Coarse problem exact infty_error : %1.6e\n",infty_error);CHKERRQ(ierr); 81086e683305SStefano Zampini ierr = PetscViewerASCIIPrintf(dbg_viewer,"Coarse problem residual infty_error: %1.6e\n",abs_infty_error);CHKERRQ(ierr); 8109b0f5fe93SStefano Zampini if (CoarseNullSpace) { 8110b0f5fe93SStefano Zampini ierr = PetscViewerASCIIPrintf(dbg_viewer,"Coarse problem is singular\n");CHKERRQ(ierr); 8111b0f5fe93SStefano Zampini } 81126e683305SStefano Zampini if (compute_eigs) { 81136e683305SStefano Zampini PetscReal lambda_max_s,lambda_min_s; 8114b03ebc13SStefano Zampini KSPConvergedReason reason; 8115deec49d1SStefano Zampini ierr = KSPGetType(check_ksp,&check_ksp_type);CHKERRQ(ierr); 8116c8587f34SStefano Zampini ierr = KSPGetIterationNumber(check_ksp,&its);CHKERRQ(ierr); 8117b03ebc13SStefano Zampini ierr = KSPGetConvergedReason(check_ksp,&reason);CHKERRQ(ierr); 81186e683305SStefano Zampini ierr = KSPComputeExtremeSingularValues(check_ksp,&lambda_max_s,&lambda_min_s);CHKERRQ(ierr); 8119b03ebc13SStefano Zampini ierr = PetscViewerASCIIPrintf(dbg_viewer,"Coarse problem eigenvalues (estimated with %d iterations of %s, conv reason %d): %1.6e %1.6e (%1.6e %1.6e)\n",its,check_ksp_type,reason,lambda_min,lambda_max,lambda_min_s,lambda_max_s);CHKERRQ(ierr); 81206e683305SStefano Zampini for (i=0;i<neigs;i++) { 81216e683305SStefano Zampini ierr = 
PetscViewerASCIIPrintf(dbg_viewer,"%1.6e %1.6ei\n",eigs_r[i],eigs_c[i]);CHKERRQ(ierr); 8122c8587f34SStefano Zampini } 81236e683305SStefano Zampini } 81246e683305SStefano Zampini ierr = PetscViewerFlush(dbg_viewer);CHKERRQ(ierr); 81256e683305SStefano Zampini ierr = PetscViewerASCIISubtractTab(dbg_viewer,2*(pcbddc->current_level+1));CHKERRQ(ierr); 81266e683305SStefano Zampini } 8127e4d548c7SStefano Zampini ierr = VecDestroy(&check_vec);CHKERRQ(ierr); 81282701bc32SStefano Zampini ierr = VecDestroy(&coarse_vec);CHKERRQ(ierr); 8129c8587f34SStefano Zampini ierr = KSPDestroy(&check_ksp);CHKERRQ(ierr); 81306e683305SStefano Zampini if (compute_eigs) { 81316e683305SStefano Zampini ierr = PetscFree(eigs_r);CHKERRQ(ierr); 81326e683305SStefano Zampini ierr = PetscFree(eigs_c);CHKERRQ(ierr); 8133c8587f34SStefano Zampini } 81346e683305SStefano Zampini } 81356e683305SStefano Zampini } 8136bef83e63SStefano Zampini ierr = MatNullSpaceDestroy(&CoarseNullSpace);CHKERRQ(ierr); 8137cbcc2c2aSStefano Zampini /* print additional info */ 8138cbcc2c2aSStefano Zampini if (pcbddc->dbg_flag) { 81396e683305SStefano Zampini /* waits until all processes reaches this point */ 81406e683305SStefano Zampini ierr = PetscBarrier((PetscObject)pc);CHKERRQ(ierr); 8141cbcc2c2aSStefano Zampini ierr = PetscViewerASCIIPrintf(pcbddc->dbg_viewer,"Coarse solver setup completed at level %d\n",pcbddc->current_level);CHKERRQ(ierr); 8142cbcc2c2aSStefano Zampini ierr = PetscViewerFlush(pcbddc->dbg_viewer);CHKERRQ(ierr); 8143cbcc2c2aSStefano Zampini } 8144cbcc2c2aSStefano Zampini 81452b510759SStefano Zampini /* free memory */ 8146fdc635d7SStefano Zampini ierr = MatDestroy(&coarse_mat);CHKERRQ(ierr); 8147c8587f34SStefano Zampini PetscFunctionReturn(0); 8148c8587f34SStefano Zampini } 8149674ae819SStefano Zampini 8150f34684f1SStefano Zampini PetscErrorCode PCBDDCComputePrimalNumbering(PC pc,PetscInt* coarse_size_n,PetscInt** local_primal_indices_n) 8151f34684f1SStefano Zampini { 8152f34684f1SStefano Zampini PC_BDDC* 
pcbddc = (PC_BDDC*)pc->data; 8153f34684f1SStefano Zampini PC_IS* pcis = (PC_IS*)pc->data; 8154f34684f1SStefano Zampini Mat_IS* matis = (Mat_IS*)pc->pmat->data; 8155dc456d91SStefano Zampini IS subset,subset_mult,subset_n; 8156dc456d91SStefano Zampini PetscInt local_size,coarse_size=0; 815773be2a3aSStefano Zampini PetscInt *local_primal_indices=NULL; 8158dc456d91SStefano Zampini const PetscInt *t_local_primal_indices; 8159f34684f1SStefano Zampini PetscErrorCode ierr; 8160f34684f1SStefano Zampini 8161f34684f1SStefano Zampini PetscFunctionBegin; 8162f34684f1SStefano Zampini /* Compute global number of coarse dofs */ 81636c4ed002SBarry Smith if (pcbddc->local_primal_size && !pcbddc->local_primal_ref_node) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"BDDC ConstraintsSetUp should be called first"); 8164dc456d91SStefano Zampini ierr = ISCreateGeneral(PetscObjectComm((PetscObject)(pc->pmat)),pcbddc->local_primal_size_cc,pcbddc->local_primal_ref_node,PETSC_COPY_VALUES,&subset_n);CHKERRQ(ierr); 81653bbff08aSStefano Zampini ierr = ISLocalToGlobalMappingApplyIS(pcis->mapping,subset_n,&subset);CHKERRQ(ierr); 8166dc456d91SStefano Zampini ierr = ISDestroy(&subset_n);CHKERRQ(ierr); 8167dc456d91SStefano Zampini ierr = ISCreateGeneral(PetscObjectComm((PetscObject)(pc->pmat)),pcbddc->local_primal_size_cc,pcbddc->local_primal_ref_mult,PETSC_COPY_VALUES,&subset_mult);CHKERRQ(ierr); 81686583bcc1SStefano Zampini ierr = ISRenumber(subset,subset_mult,&coarse_size,&subset_n);CHKERRQ(ierr); 8169dc456d91SStefano Zampini ierr = ISDestroy(&subset);CHKERRQ(ierr); 8170dc456d91SStefano Zampini ierr = ISDestroy(&subset_mult);CHKERRQ(ierr); 8171dc456d91SStefano Zampini ierr = ISGetLocalSize(subset_n,&local_size);CHKERRQ(ierr); 81726c4ed002SBarry Smith if (local_size != pcbddc->local_primal_size) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Invalid number of local primal indices computed %D != %D",local_size,pcbddc->local_primal_size); 8173dc456d91SStefano Zampini ierr = 
PetscMalloc1(local_size,&local_primal_indices);CHKERRQ(ierr); 8174dc456d91SStefano Zampini ierr = ISGetIndices(subset_n,&t_local_primal_indices);CHKERRQ(ierr); 8175dc456d91SStefano Zampini ierr = PetscMemcpy(local_primal_indices,t_local_primal_indices,local_size*sizeof(PetscInt));CHKERRQ(ierr); 8176dc456d91SStefano Zampini ierr = ISRestoreIndices(subset_n,&t_local_primal_indices);CHKERRQ(ierr); 8177dc456d91SStefano Zampini ierr = ISDestroy(&subset_n);CHKERRQ(ierr); 8178f34684f1SStefano Zampini 8179f34684f1SStefano Zampini /* check numbering */ 8180f34684f1SStefano Zampini if (pcbddc->dbg_flag) { 8181019a44ceSStefano Zampini PetscScalar coarsesum,*array,*array2; 8182dc456d91SStefano Zampini PetscInt i; 8183b9b85e73SStefano Zampini PetscBool set_error = PETSC_FALSE,set_error_reduced = PETSC_FALSE; 8184f34684f1SStefano Zampini 8185f34684f1SStefano Zampini ierr = PetscViewerFlush(pcbddc->dbg_viewer);CHKERRQ(ierr); 8186f34684f1SStefano Zampini ierr = PetscViewerASCIIPrintf(pcbddc->dbg_viewer,"--------------------------------------------------\n");CHKERRQ(ierr); 8187f34684f1SStefano Zampini ierr = PetscViewerASCIIPrintf(pcbddc->dbg_viewer,"Check coarse indices\n");CHKERRQ(ierr); 81881575c14dSBarry Smith ierr = PetscViewerASCIIPushSynchronized(pcbddc->dbg_viewer);CHKERRQ(ierr); 8189019a44ceSStefano Zampini /* counter */ 8190019a44ceSStefano Zampini ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr); 8191019a44ceSStefano Zampini ierr = VecSet(pcis->vec1_N,1.0);CHKERRQ(ierr); 8192019a44ceSStefano Zampini ierr = VecScatterBegin(matis->rctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 8193019a44ceSStefano Zampini ierr = VecScatterEnd(matis->rctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 8194019a44ceSStefano Zampini ierr = VecScatterBegin(matis->rctx,pcis->vec1_global,pcis->vec2_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 8195019a44ceSStefano Zampini ierr = 
VecScatterEnd(matis->rctx,pcis->vec1_global,pcis->vec2_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 8196f34684f1SStefano Zampini ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr); 8197f34684f1SStefano Zampini for (i=0;i<pcbddc->local_primal_size;i++) { 8198727cdba6SStefano Zampini ierr = VecSetValue(pcis->vec1_N,pcbddc->primal_indices_local_idxs[i],1.0,INSERT_VALUES);CHKERRQ(ierr); 8199f34684f1SStefano Zampini } 8200f34684f1SStefano Zampini ierr = VecAssemblyBegin(pcis->vec1_N);CHKERRQ(ierr); 8201f34684f1SStefano Zampini ierr = VecAssemblyEnd(pcis->vec1_N);CHKERRQ(ierr); 8202f34684f1SStefano Zampini ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr); 8203e176bc59SStefano Zampini ierr = VecScatterBegin(matis->rctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 8204e176bc59SStefano Zampini ierr = VecScatterEnd(matis->rctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 8205e176bc59SStefano Zampini ierr = VecScatterBegin(matis->rctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 8206e176bc59SStefano Zampini ierr = VecScatterEnd(matis->rctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 8207f34684f1SStefano Zampini ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 8208019a44ceSStefano Zampini ierr = VecGetArray(pcis->vec2_N,&array2);CHKERRQ(ierr); 8209f34684f1SStefano Zampini for (i=0;i<pcis->n;i++) { 8210019a44ceSStefano Zampini if (array[i] != 0.0 && array[i] != array2[i]) { 82112c66d082SStefano Zampini PetscInt owned = (PetscInt)PetscRealPart(array[i]),gi; 821275c01103SStefano Zampini PetscInt neigh = (PetscInt)PetscRealPart(array2[i]); 8213b9b85e73SStefano Zampini set_error = PETSC_TRUE; 82142c66d082SStefano Zampini ierr = ISLocalToGlobalMappingApply(pcis->mapping,1,&i,&gi);CHKERRQ(ierr); 82152c66d082SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"Subdomain %04d: local index %d (gid %d) owned by %d processes instead of 
%d!\n",PetscGlobalRank,i,gi,owned,neigh);CHKERRQ(ierr); 8216f34684f1SStefano Zampini } 8217f34684f1SStefano Zampini } 8218019a44ceSStefano Zampini ierr = VecRestoreArray(pcis->vec2_N,&array2);CHKERRQ(ierr); 8219b2566f29SBarry Smith ierr = MPIU_Allreduce(&set_error,&set_error_reduced,1,MPIU_BOOL,MPI_LOR,PetscObjectComm((PetscObject)pc));CHKERRQ(ierr); 8220f34684f1SStefano Zampini ierr = PetscViewerFlush(pcbddc->dbg_viewer);CHKERRQ(ierr); 8221f34684f1SStefano Zampini for (i=0;i<pcis->n;i++) { 8222f34684f1SStefano Zampini if (PetscRealPart(array[i]) > 0.0) array[i] = 1.0/PetscRealPart(array[i]); 8223f34684f1SStefano Zampini } 8224f34684f1SStefano Zampini ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 8225f34684f1SStefano Zampini ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr); 8226e176bc59SStefano Zampini ierr = VecScatterBegin(matis->rctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 8227e176bc59SStefano Zampini ierr = VecScatterEnd(matis->rctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 8228f34684f1SStefano Zampini ierr = VecSum(pcis->vec1_global,&coarsesum);CHKERRQ(ierr); 8229f34684f1SStefano Zampini ierr = PetscViewerASCIIPrintf(pcbddc->dbg_viewer,"Size of coarse problem is %d (%lf)\n",coarse_size,PetscRealPart(coarsesum));CHKERRQ(ierr); 8230b9b85e73SStefano Zampini if (pcbddc->dbg_flag > 1 || set_error_reduced) { 8231ca8b9ea9SStefano Zampini PetscInt *gidxs; 8232ca8b9ea9SStefano Zampini 8233ca8b9ea9SStefano Zampini ierr = PetscMalloc1(pcbddc->local_primal_size,&gidxs);CHKERRQ(ierr); 82343bbff08aSStefano Zampini ierr = ISLocalToGlobalMappingApply(pcis->mapping,pcbddc->local_primal_size,pcbddc->primal_indices_local_idxs,gidxs);CHKERRQ(ierr); 8235f34684f1SStefano Zampini ierr = PetscViewerASCIIPrintf(pcbddc->dbg_viewer,"Distribution of local primal indices\n");CHKERRQ(ierr); 8236f34684f1SStefano Zampini ierr = PetscViewerFlush(pcbddc->dbg_viewer);CHKERRQ(ierr); 8237f34684f1SStefano Zampini ierr 
= PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"Subdomain %04d\n",PetscGlobalRank);CHKERRQ(ierr); 8238f34684f1SStefano Zampini for (i=0;i<pcbddc->local_primal_size;i++) { 82394bc2dc4bSStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"local_primal_indices[%d]=%d (%d,%d)\n",i,local_primal_indices[i],pcbddc->primal_indices_local_idxs[i],gidxs[i]);CHKERRQ(ierr); 8240f34684f1SStefano Zampini } 8241f34684f1SStefano Zampini ierr = PetscViewerFlush(pcbddc->dbg_viewer);CHKERRQ(ierr); 8242ca8b9ea9SStefano Zampini ierr = PetscFree(gidxs);CHKERRQ(ierr); 8243f34684f1SStefano Zampini } 8244f34684f1SStefano Zampini ierr = PetscViewerFlush(pcbddc->dbg_viewer);CHKERRQ(ierr); 82451575c14dSBarry Smith ierr = PetscViewerASCIIPushSynchronized(pcbddc->dbg_viewer);CHKERRQ(ierr); 8246302440fdSBarry Smith if (set_error_reduced) SETERRQ(PetscObjectComm((PetscObject)pc),PETSC_ERR_PLIB,"BDDC Numbering of coarse dofs failed"); 8247f34684f1SStefano Zampini } 82488bec7fa6SStefano Zampini /* ierr = PetscPrintf(PetscObjectComm((PetscObject)pc),"Size of coarse problem is %d\n",coarse_size);CHKERRQ(ierr); */ 8249f34684f1SStefano Zampini /* get back data */ 8250f34684f1SStefano Zampini *coarse_size_n = coarse_size; 8251f34684f1SStefano Zampini *local_primal_indices_n = local_primal_indices; 8252674ae819SStefano Zampini PetscFunctionReturn(0); 8253674ae819SStefano Zampini } 8254674ae819SStefano Zampini 8255a7dc3881SStefano Zampini PetscErrorCode PCBDDCGlobalToLocal(VecScatter g2l_ctx,Vec gwork, Vec lwork, IS globalis, IS* localis) 8256e456f2a8SStefano Zampini { 8257e456f2a8SStefano Zampini IS localis_t; 8258a7dc3881SStefano Zampini PetscInt i,lsize,*idxs,n; 8259e456f2a8SStefano Zampini PetscScalar *vals; 8260e456f2a8SStefano Zampini PetscErrorCode ierr; 8261e456f2a8SStefano Zampini 8262e456f2a8SStefano Zampini PetscFunctionBegin; 8263a7dc3881SStefano Zampini /* get indices in local ordering exploiting local to global map */ 8264e456f2a8SStefano Zampini ierr = 
ISGetLocalSize(globalis,&lsize);CHKERRQ(ierr); 8265854ce69bSBarry Smith ierr = PetscMalloc1(lsize,&vals);CHKERRQ(ierr); 8266e456f2a8SStefano Zampini for (i=0;i<lsize;i++) vals[i] = 1.0; 8267e456f2a8SStefano Zampini ierr = ISGetIndices(globalis,(const PetscInt**)&idxs);CHKERRQ(ierr); 8268a7dc3881SStefano Zampini ierr = VecSet(gwork,0.0);CHKERRQ(ierr); 8269a7dc3881SStefano Zampini ierr = VecSet(lwork,0.0);CHKERRQ(ierr); 82701035eff8SStefano Zampini if (idxs) { /* multilevel guard */ 8271a7dc3881SStefano Zampini ierr = VecSetValues(gwork,lsize,idxs,vals,INSERT_VALUES);CHKERRQ(ierr); 82721035eff8SStefano Zampini } 8273a7dc3881SStefano Zampini ierr = VecAssemblyBegin(gwork);CHKERRQ(ierr); 8274e456f2a8SStefano Zampini ierr = ISRestoreIndices(globalis,(const PetscInt**)&idxs);CHKERRQ(ierr); 8275e456f2a8SStefano Zampini ierr = PetscFree(vals);CHKERRQ(ierr); 8276a7dc3881SStefano Zampini ierr = VecAssemblyEnd(gwork);CHKERRQ(ierr); 8277a7dc3881SStefano Zampini /* now compute set in local ordering */ 8278a7dc3881SStefano Zampini ierr = VecScatterBegin(g2l_ctx,gwork,lwork,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 8279a7dc3881SStefano Zampini ierr = VecScatterEnd(g2l_ctx,gwork,lwork,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 8280a7dc3881SStefano Zampini ierr = VecGetArrayRead(lwork,(const PetscScalar**)&vals);CHKERRQ(ierr); 8281a7dc3881SStefano Zampini ierr = VecGetSize(lwork,&n);CHKERRQ(ierr); 8282a7dc3881SStefano Zampini for (i=0,lsize=0;i<n;i++) { 8283ff92baa0SMatthew G. Knepley if (PetscRealPart(vals[i]) > 0.5) { 8284e456f2a8SStefano Zampini lsize++; 8285e456f2a8SStefano Zampini } 8286e456f2a8SStefano Zampini } 8287854ce69bSBarry Smith ierr = PetscMalloc1(lsize,&idxs);CHKERRQ(ierr); 8288a7dc3881SStefano Zampini for (i=0,lsize=0;i<n;i++) { 8289ff92baa0SMatthew G. 
Knepley if (PetscRealPart(vals[i]) > 0.5) { 8290e456f2a8SStefano Zampini idxs[lsize++] = i; 8291e456f2a8SStefano Zampini } 8292e456f2a8SStefano Zampini } 8293a7dc3881SStefano Zampini ierr = VecRestoreArrayRead(lwork,(const PetscScalar**)&vals);CHKERRQ(ierr); 8294a7dc3881SStefano Zampini ierr = ISCreateGeneral(PetscObjectComm((PetscObject)gwork),lsize,idxs,PETSC_OWN_POINTER,&localis_t);CHKERRQ(ierr); 8295e456f2a8SStefano Zampini *localis = localis_t; 8296e456f2a8SStefano Zampini PetscFunctionReturn(0); 8297e456f2a8SStefano Zampini } 8298906d46d4SStefano Zampini 829908122e43SStefano Zampini PetscErrorCode PCBDDCSetUpSubSchurs(PC pc) 8300b96c3477SStefano Zampini { 8301a64f4aa4SStefano Zampini PC_IS *pcis=(PC_IS*)pc->data; 8302b96c3477SStefano Zampini PC_BDDC *pcbddc=(PC_BDDC*)pc->data; 8303b96c3477SStefano Zampini PCBDDCSubSchurs sub_schurs=pcbddc->sub_schurs; 8304a64f4aa4SStefano Zampini Mat S_j; 8305b96c3477SStefano Zampini PetscInt *used_xadj,*used_adjncy; 8306b96c3477SStefano Zampini PetscBool free_used_adj; 8307b96c3477SStefano Zampini PetscErrorCode ierr; 8308b96c3477SStefano Zampini 8309b96c3477SStefano Zampini PetscFunctionBegin; 8310b96c3477SStefano Zampini /* decide the adjacency to be used for determining internal problems for local schur on subsets */ 8311b96c3477SStefano Zampini free_used_adj = PETSC_FALSE; 831208122e43SStefano Zampini if (pcbddc->sub_schurs_layers == -1) { 8313b96c3477SStefano Zampini used_xadj = NULL; 8314b96c3477SStefano Zampini used_adjncy = NULL; 8315b96c3477SStefano Zampini } else { 831608122e43SStefano Zampini if (pcbddc->sub_schurs_use_useradj && pcbddc->mat_graph->xadj) { 831708122e43SStefano Zampini used_xadj = pcbddc->mat_graph->xadj; 831808122e43SStefano Zampini used_adjncy = pcbddc->mat_graph->adjncy; 831908122e43SStefano Zampini } else if (pcbddc->computed_rowadj) { 8320b96c3477SStefano Zampini used_xadj = pcbddc->mat_graph->xadj; 8321b96c3477SStefano Zampini used_adjncy = pcbddc->mat_graph->adjncy; 8322b96c3477SStefano 
Zampini } else { 83232fffb893SStefano Zampini PetscBool flg_row=PETSC_FALSE; 8324b96c3477SStefano Zampini const PetscInt *xadj,*adjncy; 8325b96c3477SStefano Zampini PetscInt nvtxs; 8326b96c3477SStefano Zampini 83272fffb893SStefano Zampini ierr = MatGetRowIJ(pcbddc->local_mat,0,PETSC_TRUE,PETSC_FALSE,&nvtxs,&xadj,&adjncy,&flg_row);CHKERRQ(ierr); 83282fffb893SStefano Zampini if (flg_row) { 8329b96c3477SStefano Zampini ierr = PetscMalloc2(nvtxs+1,&used_xadj,xadj[nvtxs],&used_adjncy);CHKERRQ(ierr); 8330b96c3477SStefano Zampini ierr = PetscMemcpy(used_xadj,xadj,(nvtxs+1)*sizeof(*xadj));CHKERRQ(ierr); 8331b96c3477SStefano Zampini ierr = PetscMemcpy(used_adjncy,adjncy,(xadj[nvtxs])*sizeof(*adjncy));CHKERRQ(ierr); 8332b96c3477SStefano Zampini free_used_adj = PETSC_TRUE; 83332fffb893SStefano Zampini } else { 83342fffb893SStefano Zampini pcbddc->sub_schurs_layers = -1; 83352fffb893SStefano Zampini used_xadj = NULL; 83362fffb893SStefano Zampini used_adjncy = NULL; 83372fffb893SStefano Zampini } 83382fffb893SStefano Zampini ierr = MatRestoreRowIJ(pcbddc->local_mat,0,PETSC_TRUE,PETSC_FALSE,&nvtxs,&xadj,&adjncy,&flg_row);CHKERRQ(ierr); 8339b96c3477SStefano Zampini } 8340b96c3477SStefano Zampini } 8341d5574798SStefano Zampini 8342d5574798SStefano Zampini /* setup sub_schurs data */ 8343a64f4aa4SStefano Zampini ierr = MatCreateSchurComplement(pcis->A_II,pcis->A_II,pcis->A_IB,pcis->A_BI,pcis->A_BB,&S_j);CHKERRQ(ierr); 8344df4d28bfSStefano Zampini if (!sub_schurs->schur_explicit) { 8345df4d28bfSStefano Zampini /* pcbddc->ksp_D up to date only if not using MatFactor with Schur complement support */ 8346a64f4aa4SStefano Zampini ierr = MatSchurComplementSetKSP(S_j,pcbddc->ksp_D);CHKERRQ(ierr); 834791af6908SStefano Zampini ierr = PCBDDCSubSchursSetUp(sub_schurs,NULL,S_j,PETSC_FALSE,used_xadj,used_adjncy,pcbddc->sub_schurs_layers,NULL,pcbddc->adaptive_selection,PETSC_FALSE,PETSC_FALSE,0,NULL,NULL,NULL,NULL);CHKERRQ(ierr); 8348a64f4aa4SStefano Zampini } else { 834972b8c272SStefano Zampini 
Mat change = NULL; 83509d54b7f4SStefano Zampini Vec scaling = NULL; 8351111315fdSstefano_zampini IS change_primal = NULL, iP; 8352111315fdSstefano_zampini PetscInt benign_n; 8353111315fdSstefano_zampini PetscBool reuse_solvers = (PetscBool)!pcbddc->use_change_of_basis; 8354111315fdSstefano_zampini PetscBool isseqaij,need_change = PETSC_FALSE; 8355111315fdSstefano_zampini PetscBool discrete_harmonic = PETSC_FALSE; 8356a3df083aSStefano Zampini 83575feab87aSStefano Zampini if (!pcbddc->use_vertices && reuse_solvers) { 83585feab87aSStefano Zampini PetscInt n_vertices; 83595feab87aSStefano Zampini 83605feab87aSStefano Zampini ierr = ISGetLocalSize(sub_schurs->is_vertices,&n_vertices);CHKERRQ(ierr); 83612034aafcSStefano Zampini reuse_solvers = (PetscBool)!n_vertices; 83625feab87aSStefano Zampini } 836304708bb6SStefano Zampini ierr = PetscObjectTypeCompare((PetscObject)pcbddc->local_mat,MATSEQAIJ,&isseqaij);CHKERRQ(ierr); 836404708bb6SStefano Zampini if (!isseqaij) { 836504708bb6SStefano Zampini Mat_IS* matis = (Mat_IS*)pc->pmat->data; 836604708bb6SStefano Zampini if (matis->A == pcbddc->local_mat) { 836704708bb6SStefano Zampini ierr = MatDestroy(&pcbddc->local_mat);CHKERRQ(ierr); 836804708bb6SStefano Zampini ierr = MatConvert(matis->A,MATSEQAIJ,MAT_INITIAL_MATRIX,&pcbddc->local_mat);CHKERRQ(ierr); 836904708bb6SStefano Zampini } else { 8370511c6705SHong Zhang ierr = MatConvert(pcbddc->local_mat,MATSEQAIJ,MAT_INPLACE_MATRIX,&pcbddc->local_mat);CHKERRQ(ierr); 837104708bb6SStefano Zampini } 837204708bb6SStefano Zampini } 8373a3df083aSStefano Zampini if (!pcbddc->benign_change_explicit) { 8374a3df083aSStefano Zampini benign_n = pcbddc->benign_n; 8375ca92afb2SStefano Zampini } else { 8376a3df083aSStefano Zampini benign_n = 0; 8377ca92afb2SStefano Zampini } 8378b7ab4a40SStefano Zampini /* sub_schurs->change is a local object; instead, PCBDDCConstraintsSetUp and the quantities used in the test below are logically collective on pc. 
8379b7ab4a40SStefano Zampini We need a global reduction to avoid possible deadlocks. 8380b7ab4a40SStefano Zampini We assume that sub_schurs->change is created once, and then reused for different solves, unless the topography has been recomputed */ 838172b8c272SStefano Zampini if (pcbddc->adaptive_userdefined || (pcbddc->deluxe_zerorows && !pcbddc->use_change_of_basis)) { 838222db5ddcSStefano Zampini PetscBool have_loc_change = (PetscBool)(!!sub_schurs->change); 8383b7ab4a40SStefano Zampini ierr = MPIU_Allreduce(&have_loc_change,&need_change,1,MPIU_BOOL,MPI_LOR,PetscObjectComm((PetscObject)pc));CHKERRQ(ierr); 838422db5ddcSStefano Zampini need_change = (PetscBool)(!need_change); 8385b7ab4a40SStefano Zampini } 8386b7ab4a40SStefano Zampini /* If the user defines additional constraints, we import them here. 8387b7ab4a40SStefano Zampini We need to compute the change of basis according to the quadrature weights attached to pmat via MatSetNearNullSpace, and this could not be done (at the moment) without some hacking */ 8388b7ab4a40SStefano Zampini if (need_change) { 838988c03ad3SStefano Zampini PC_IS *pcisf; 839088c03ad3SStefano Zampini PC_BDDC *pcbddcf; 839188c03ad3SStefano Zampini PC pcf; 839288c03ad3SStefano Zampini 8393e4d548c7SStefano Zampini if (pcbddc->sub_schurs_rebuild) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"Cannot compute change of basis with a different graph"); 839488c03ad3SStefano Zampini ierr = PCCreate(PetscObjectComm((PetscObject)pc),&pcf);CHKERRQ(ierr); 839588c03ad3SStefano Zampini ierr = PCSetOperators(pcf,pc->mat,pc->pmat);CHKERRQ(ierr); 839688c03ad3SStefano Zampini ierr = PCSetType(pcf,PCBDDC);CHKERRQ(ierr); 8397b9be95fcSstefano_zampini 839888c03ad3SStefano Zampini /* hacks */ 839988c03ad3SStefano Zampini pcisf = (PC_IS*)pcf->data; 840072b8c272SStefano Zampini pcisf->is_B_local = pcis->is_B_local; 840172b8c272SStefano Zampini pcisf->vec1_N = pcis->vec1_N; 840272b8c272SStefano Zampini pcisf->BtoNmap = pcis->BtoNmap; 840372b8c272SStefano Zampini pcisf->n 
= pcis->n; 840472b8c272SStefano Zampini pcisf->n_B = pcis->n_B; 840588c03ad3SStefano Zampini pcbddcf = (PC_BDDC*)pcf->data; 840688c03ad3SStefano Zampini ierr = PetscFree(pcbddcf->mat_graph);CHKERRQ(ierr); 840788c03ad3SStefano Zampini pcbddcf->mat_graph = pcbddc->mat_graph; 840888c03ad3SStefano Zampini pcbddcf->use_faces = PETSC_TRUE; 840988c03ad3SStefano Zampini pcbddcf->use_change_of_basis = PETSC_TRUE; 841088c03ad3SStefano Zampini pcbddcf->use_change_on_faces = PETSC_TRUE; 841172b8c272SStefano Zampini pcbddcf->use_qr_single = PETSC_TRUE; 841288c03ad3SStefano Zampini pcbddcf->fake_change = PETSC_TRUE; 8413b9be95fcSstefano_zampini 8414b9be95fcSstefano_zampini /* setup constraints so that we can get information on primal vertices and change of basis (in local numbering) */ 841588c03ad3SStefano Zampini ierr = PCBDDCConstraintsSetUp(pcf);CHKERRQ(ierr); 841672b8c272SStefano Zampini sub_schurs->change_with_qr = pcbddcf->use_qr_single; 841772b8c272SStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,pcbddcf->n_vertices,pcbddcf->local_primal_ref_node,PETSC_COPY_VALUES,&change_primal);CHKERRQ(ierr); 841872b8c272SStefano Zampini change = pcbddcf->ConstraintMatrix; 841972b8c272SStefano Zampini pcbddcf->ConstraintMatrix = NULL; 8420b9be95fcSstefano_zampini 842188c03ad3SStefano Zampini /* free unneeded memory allocated in PCBDDCConstraintsSetUp */ 842272b8c272SStefano Zampini ierr = PetscFree(pcbddcf->sub_schurs);CHKERRQ(ierr); 842388c03ad3SStefano Zampini ierr = MatNullSpaceDestroy(&pcbddcf->onearnullspace);CHKERRQ(ierr); 842488c03ad3SStefano Zampini ierr = PetscFree2(pcbddcf->local_primal_ref_node,pcbddcf->local_primal_ref_mult);CHKERRQ(ierr); 842588c03ad3SStefano Zampini ierr = PetscFree(pcbddcf->primal_indices_local_idxs);CHKERRQ(ierr); 842688c03ad3SStefano Zampini ierr = PetscFree(pcbddcf->onearnullvecs_state);CHKERRQ(ierr); 842788c03ad3SStefano Zampini ierr = PetscFree(pcf->data);CHKERRQ(ierr); 842888c03ad3SStefano Zampini pcf->ops->destroy = NULL; 
8429b9be95fcSstefano_zampini pcf->ops->reset = NULL; 843088c03ad3SStefano Zampini ierr = PCDestroy(&pcf);CHKERRQ(ierr); 843188c03ad3SStefano Zampini } 84329d54b7f4SStefano Zampini if (!pcbddc->use_deluxe_scaling) scaling = pcis->D; 8433111315fdSstefano_zampini 8434111315fdSstefano_zampini ierr = PetscObjectQuery((PetscObject)pc,"__KSPFETIDP_iP",(PetscObject*)&iP);CHKERRQ(ierr); 8435111315fdSstefano_zampini if (iP) { 8436111315fdSstefano_zampini ierr = PetscOptionsBegin(PetscObjectComm((PetscObject)iP),sub_schurs->prefix,"BDDC sub_schurs options","PC");CHKERRQ(ierr); 8437111315fdSstefano_zampini ierr = PetscOptionsBool("-sub_schurs_discrete_harmonic",NULL,NULL,discrete_harmonic,&discrete_harmonic,NULL);CHKERRQ(ierr); 8438111315fdSstefano_zampini ierr = PetscOptionsEnd();CHKERRQ(ierr); 8439111315fdSstefano_zampini } 8440111315fdSstefano_zampini if (discrete_harmonic) { 8441111315fdSstefano_zampini Mat A; 8442111315fdSstefano_zampini ierr = MatDuplicate(pcbddc->local_mat,MAT_COPY_VALUES,&A);CHKERRQ(ierr); 8443111315fdSstefano_zampini ierr = MatZeroRowsColumnsIS(A,iP,1.0,NULL,NULL);CHKERRQ(ierr); 8444111315fdSstefano_zampini ierr = PetscObjectCompose((PetscObject)A,"__KSPFETIDP_iP",(PetscObject)iP);CHKERRQ(ierr); 8445111315fdSstefano_zampini ierr = PCBDDCSubSchursSetUp(sub_schurs,A,S_j,pcbddc->sub_schurs_exact_schur,used_xadj,used_adjncy,pcbddc->sub_schurs_layers,scaling,pcbddc->adaptive_selection,reuse_solvers,pcbddc->benign_saddle_point,benign_n,pcbddc->benign_p0_lidx,pcbddc->benign_zerodiag_subs,change,change_primal);CHKERRQ(ierr); 8446111315fdSstefano_zampini ierr = MatDestroy(&A);CHKERRQ(ierr); 8447111315fdSstefano_zampini } else { 844891af6908SStefano Zampini ierr = 
PCBDDCSubSchursSetUp(sub_schurs,pcbddc->local_mat,S_j,pcbddc->sub_schurs_exact_schur,used_xadj,used_adjncy,pcbddc->sub_schurs_layers,scaling,pcbddc->adaptive_selection,reuse_solvers,pcbddc->benign_saddle_point,benign_n,pcbddc->benign_p0_lidx,pcbddc->benign_zerodiag_subs,change,change_primal);CHKERRQ(ierr); 8449111315fdSstefano_zampini } 845072b8c272SStefano Zampini ierr = MatDestroy(&change);CHKERRQ(ierr); 845172b8c272SStefano Zampini ierr = ISDestroy(&change_primal);CHKERRQ(ierr); 8452ca92afb2SStefano Zampini } 8453d12d3064SStefano Zampini ierr = MatDestroy(&S_j);CHKERRQ(ierr); 8454b96c3477SStefano Zampini 8455b96c3477SStefano Zampini /* free adjacency */ 8456b96c3477SStefano Zampini if (free_used_adj) { 8457b96c3477SStefano Zampini ierr = PetscFree2(used_xadj,used_adjncy);CHKERRQ(ierr); 8458b96c3477SStefano Zampini } 8459b96c3477SStefano Zampini PetscFunctionReturn(0); 8460b96c3477SStefano Zampini } 8461b96c3477SStefano Zampini 846208122e43SStefano Zampini PetscErrorCode PCBDDCInitSubSchurs(PC pc) 8463b96c3477SStefano Zampini { 8464b96c3477SStefano Zampini PC_IS *pcis=(PC_IS*)pc->data; 8465b96c3477SStefano Zampini PC_BDDC *pcbddc=(PC_BDDC*)pc->data; 8466b96c3477SStefano Zampini PCBDDCGraph graph; 8467b96c3477SStefano Zampini PetscErrorCode ierr; 8468b96c3477SStefano Zampini 8469b96c3477SStefano Zampini PetscFunctionBegin; 8470b96c3477SStefano Zampini /* attach interface graph for determining subsets */ 847108122e43SStefano Zampini if (pcbddc->sub_schurs_rebuild) { /* in case rebuild has been requested, it uses a graph generated only by the neighbouring information */ 84723301b35fSStefano Zampini IS verticesIS,verticescomm; 84733301b35fSStefano Zampini PetscInt vsize,*idxs; 8474b96c3477SStefano Zampini 8475b96c3477SStefano Zampini ierr = PCBDDCGraphGetCandidatesIS(pcbddc->mat_graph,NULL,NULL,NULL,NULL,&verticesIS);CHKERRQ(ierr); 84763301b35fSStefano Zampini ierr = ISGetSize(verticesIS,&vsize);CHKERRQ(ierr); 84773301b35fSStefano Zampini ierr = 
ISGetIndices(verticesIS,(const PetscInt**)&idxs);CHKERRQ(ierr); 84783301b35fSStefano Zampini ierr = ISCreateGeneral(PetscObjectComm((PetscObject)pc),vsize,idxs,PETSC_COPY_VALUES,&verticescomm);CHKERRQ(ierr); 84793301b35fSStefano Zampini ierr = ISRestoreIndices(verticesIS,(const PetscInt**)&idxs);CHKERRQ(ierr); 8480c8272957SStefano Zampini ierr = PCBDDCGraphRestoreCandidatesIS(pcbddc->mat_graph,NULL,NULL,NULL,NULL,&verticesIS);CHKERRQ(ierr); 8481b96c3477SStefano Zampini ierr = PCBDDCGraphCreate(&graph);CHKERRQ(ierr); 8482be12c134Sstefano_zampini ierr = PCBDDCGraphInit(graph,pcbddc->mat_graph->l2gmap,pcbddc->mat_graph->nvtxs_global,pcbddc->graphmaxcount);CHKERRQ(ierr); 8483441e0de0SStefano Zampini ierr = PCBDDCGraphSetUp(graph,pcbddc->mat_graph->custom_minimal_size,NULL,pcbddc->DirichletBoundariesLocal,0,NULL,verticescomm);CHKERRQ(ierr); 84843301b35fSStefano Zampini ierr = ISDestroy(&verticescomm);CHKERRQ(ierr); 8485b96c3477SStefano Zampini ierr = PCBDDCGraphComputeConnectedComponents(graph);CHKERRQ(ierr); 8486b96c3477SStefano Zampini } else { 8487b96c3477SStefano Zampini graph = pcbddc->mat_graph; 8488b96c3477SStefano Zampini } 8489e4d548c7SStefano Zampini /* print some info */ 84905c643e28SStefano Zampini if (pcbddc->dbg_flag && !pcbddc->sub_schurs_rebuild) { 8491e4d548c7SStefano Zampini IS vertices; 8492e4d548c7SStefano Zampini PetscInt nv,nedges,nfaces; 8493c8272957SStefano Zampini ierr = PCBDDCGraphASCIIView(graph,pcbddc->dbg_flag,pcbddc->dbg_viewer);CHKERRQ(ierr); 8494e4d548c7SStefano Zampini ierr = PCBDDCGraphGetCandidatesIS(graph,&nfaces,NULL,&nedges,NULL,&vertices);CHKERRQ(ierr); 8495e4d548c7SStefano Zampini ierr = ISGetSize(vertices,&nv);CHKERRQ(ierr); 8496e4d548c7SStefano Zampini ierr = PetscViewerASCIIPushSynchronized(pcbddc->dbg_viewer);CHKERRQ(ierr); 8497e4d548c7SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"--------------------------------------------------------------\n");CHKERRQ(ierr); 8498e4d548c7SStefano Zampini ierr 
= PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"Subdomain %04d got %02d local candidate vertices (%d)\n",PetscGlobalRank,nv,pcbddc->use_vertices);CHKERRQ(ierr); 8499e4d548c7SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"Subdomain %04d got %02d local candidate edges (%d)\n",PetscGlobalRank,nedges,pcbddc->use_edges);CHKERRQ(ierr); 8500e4d548c7SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"Subdomain %04d got %02d local candidate faces (%d)\n",PetscGlobalRank,nfaces,pcbddc->use_faces);CHKERRQ(ierr); 8501e4d548c7SStefano Zampini ierr = PetscViewerFlush(pcbddc->dbg_viewer);CHKERRQ(ierr); 8502e4d548c7SStefano Zampini ierr = PetscViewerASCIIPopSynchronized(pcbddc->dbg_viewer);CHKERRQ(ierr); 8503c8272957SStefano Zampini ierr = PCBDDCGraphRestoreCandidatesIS(graph,&nfaces,NULL,&nedges,NULL,&vertices);CHKERRQ(ierr); 8504e4d548c7SStefano Zampini } 8505b96c3477SStefano Zampini 8506b96c3477SStefano Zampini /* sub_schurs init */ 8507b334f244SStefano Zampini if (!pcbddc->sub_schurs) { 8508b334f244SStefano Zampini ierr = PCBDDCSubSchursCreate(&pcbddc->sub_schurs);CHKERRQ(ierr); 8509b334f244SStefano Zampini } 85108b6046baSStefano Zampini ierr = PCBDDCSubSchursInit(pcbddc->sub_schurs,pcis->is_I_local,pcis->is_B_local,graph,pcis->BtoNmap,pcbddc->sub_schurs_rebuild);CHKERRQ(ierr); 8511e62b6521Sstefano_zampini pcbddc->sub_schurs->prefix = ((PetscObject)pc)->prefix; 8512a64f4aa4SStefano Zampini 8513b96c3477SStefano Zampini /* free graph struct */ 851408122e43SStefano Zampini if (pcbddc->sub_schurs_rebuild) { 8515b96c3477SStefano Zampini ierr = PCBDDCGraphDestroy(&graph);CHKERRQ(ierr); 8516b96c3477SStefano Zampini } 8517b96c3477SStefano Zampini PetscFunctionReturn(0); 8518b96c3477SStefano Zampini } 8519fa34dd3eSStefano Zampini 8520fa34dd3eSStefano Zampini PetscErrorCode PCBDDCCheckOperator(PC pc) 8521fa34dd3eSStefano Zampini { 8522fa34dd3eSStefano Zampini PC_IS *pcis=(PC_IS*)pc->data; 8523fa34dd3eSStefano Zampini 
PC_BDDC *pcbddc=(PC_BDDC*)pc->data; 8524fa34dd3eSStefano Zampini PetscErrorCode ierr; 8525fa34dd3eSStefano Zampini 8526fa34dd3eSStefano Zampini PetscFunctionBegin; 8527fa34dd3eSStefano Zampini if (pcbddc->n_vertices == pcbddc->local_primal_size) { 8528fa34dd3eSStefano Zampini IS zerodiag = NULL; 85294f1b2e48SStefano Zampini Mat S_j,B0_B=NULL; 8530fa34dd3eSStefano Zampini Vec dummy_vec=NULL,vec_check_B,vec_scale_P; 85314f1b2e48SStefano Zampini PetscScalar *p0_check,*array,*array2; 853275c01103SStefano Zampini PetscReal norm; 8533fa34dd3eSStefano Zampini PetscInt i; 8534fa34dd3eSStefano Zampini 8535fa34dd3eSStefano Zampini /* B0 and B0_B */ 8536fa34dd3eSStefano Zampini if (zerodiag) { 8537fa34dd3eSStefano Zampini IS dummy; 8538fa34dd3eSStefano Zampini 85394f1b2e48SStefano Zampini ierr = ISCreateStride(PETSC_COMM_SELF,pcbddc->benign_n,0,1,&dummy);CHKERRQ(ierr); 85407dae84e0SHong Zhang ierr = MatCreateSubMatrix(pcbddc->benign_B0,dummy,pcis->is_B_local,MAT_INITIAL_MATRIX,&B0_B);CHKERRQ(ierr); 8541fa34dd3eSStefano Zampini ierr = MatCreateVecs(B0_B,NULL,&dummy_vec);CHKERRQ(ierr); 8542fa34dd3eSStefano Zampini ierr = ISDestroy(&dummy);CHKERRQ(ierr); 8543fa34dd3eSStefano Zampini } 8544fa34dd3eSStefano Zampini /* I need a primal vector to scale primal nodes since BDDC sums contibutions */ 8545fa34dd3eSStefano Zampini ierr = VecDuplicate(pcbddc->vec1_P,&vec_scale_P);CHKERRQ(ierr); 8546fa34dd3eSStefano Zampini ierr = VecSet(pcbddc->vec1_P,1.0);CHKERRQ(ierr); 8547fa34dd3eSStefano Zampini ierr = VecScatterBegin(pcbddc->coarse_loc_to_glob,pcbddc->vec1_P,pcbddc->coarse_vec,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 8548fa34dd3eSStefano Zampini ierr = VecScatterEnd(pcbddc->coarse_loc_to_glob,pcbddc->vec1_P,pcbddc->coarse_vec,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 8549fa34dd3eSStefano Zampini ierr = VecScatterBegin(pcbddc->coarse_loc_to_glob,pcbddc->coarse_vec,vec_scale_P,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 8550fa34dd3eSStefano Zampini ierr = 
VecScatterEnd(pcbddc->coarse_loc_to_glob,pcbddc->coarse_vec,vec_scale_P,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 8551fa34dd3eSStefano Zampini ierr = VecReciprocal(vec_scale_P);CHKERRQ(ierr); 8552fa34dd3eSStefano Zampini /* S_j */ 8553fa34dd3eSStefano Zampini ierr = MatCreateSchurComplement(pcis->A_II,pcis->A_II,pcis->A_IB,pcis->A_BI,pcis->A_BB,&S_j);CHKERRQ(ierr); 8554fa34dd3eSStefano Zampini ierr = MatSchurComplementSetKSP(S_j,pcbddc->ksp_D);CHKERRQ(ierr); 8555fa34dd3eSStefano Zampini 8556fa34dd3eSStefano Zampini /* mimic vector in \widetilde{W}_\Gamma */ 8557fa34dd3eSStefano Zampini ierr = VecSetRandom(pcis->vec1_N,NULL);CHKERRQ(ierr); 8558fa34dd3eSStefano Zampini /* continuous in primal space */ 8559fa34dd3eSStefano Zampini ierr = VecSetRandom(pcbddc->coarse_vec,NULL);CHKERRQ(ierr); 8560fa34dd3eSStefano Zampini ierr = VecScatterBegin(pcbddc->coarse_loc_to_glob,pcbddc->coarse_vec,pcbddc->vec1_P,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 8561fa34dd3eSStefano Zampini ierr = VecScatterEnd(pcbddc->coarse_loc_to_glob,pcbddc->coarse_vec,pcbddc->vec1_P,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 8562fa34dd3eSStefano Zampini ierr = VecGetArray(pcbddc->vec1_P,&array);CHKERRQ(ierr); 85634f1b2e48SStefano Zampini ierr = PetscCalloc1(pcbddc->benign_n,&p0_check);CHKERRQ(ierr); 85644f1b2e48SStefano Zampini for (i=0;i<pcbddc->benign_n;i++) p0_check[i] = array[pcbddc->local_primal_size-pcbddc->benign_n+i]; 8565fa34dd3eSStefano Zampini ierr = VecSetValues(pcis->vec1_N,pcbddc->local_primal_size,pcbddc->local_primal_ref_node,array,INSERT_VALUES);CHKERRQ(ierr); 8566fa34dd3eSStefano Zampini ierr = VecRestoreArray(pcbddc->vec1_P,&array);CHKERRQ(ierr); 8567fa34dd3eSStefano Zampini ierr = VecAssemblyBegin(pcis->vec1_N);CHKERRQ(ierr); 8568fa34dd3eSStefano Zampini ierr = VecAssemblyEnd(pcis->vec1_N);CHKERRQ(ierr); 8569fa34dd3eSStefano Zampini ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec2_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 8570fa34dd3eSStefano Zampini 
ierr = VecScatterEnd(pcis->N_to_B,pcis->vec1_N,pcis->vec2_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 8571fa34dd3eSStefano Zampini ierr = VecDuplicate(pcis->vec2_B,&vec_check_B);CHKERRQ(ierr); 8572fa34dd3eSStefano Zampini ierr = VecCopy(pcis->vec2_B,vec_check_B);CHKERRQ(ierr); 8573fa34dd3eSStefano Zampini 8574fa34dd3eSStefano Zampini /* assemble rhs for coarse problem */ 8575fa34dd3eSStefano Zampini /* widetilde{S}_\Gamma w_\Gamma + \widetilde{B0}^T_B p0 */ 8576fa34dd3eSStefano Zampini /* local with Schur */ 8577fa34dd3eSStefano Zampini ierr = MatMult(S_j,pcis->vec2_B,pcis->vec1_B);CHKERRQ(ierr); 8578fa34dd3eSStefano Zampini if (zerodiag) { 8579fa34dd3eSStefano Zampini ierr = VecGetArray(dummy_vec,&array);CHKERRQ(ierr); 85804f1b2e48SStefano Zampini for (i=0;i<pcbddc->benign_n;i++) array[i] = p0_check[i]; 8581fa34dd3eSStefano Zampini ierr = VecRestoreArray(dummy_vec,&array);CHKERRQ(ierr); 8582fa34dd3eSStefano Zampini ierr = MatMultTransposeAdd(B0_B,dummy_vec,pcis->vec1_B,pcis->vec1_B);CHKERRQ(ierr); 8583fa34dd3eSStefano Zampini } 8584fa34dd3eSStefano Zampini /* sum on primal nodes the local contributions */ 8585fa34dd3eSStefano Zampini ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_B,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 8586fa34dd3eSStefano Zampini ierr = VecScatterEnd(pcis->N_to_B,pcis->vec1_B,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 8587fa34dd3eSStefano Zampini ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 8588fa34dd3eSStefano Zampini ierr = VecGetArray(pcbddc->vec1_P,&array2);CHKERRQ(ierr); 8589fa34dd3eSStefano Zampini for (i=0;i<pcbddc->local_primal_size;i++) array2[i] = array[pcbddc->local_primal_ref_node[i]]; 8590fa34dd3eSStefano Zampini ierr = VecRestoreArray(pcbddc->vec1_P,&array2);CHKERRQ(ierr); 8591fa34dd3eSStefano Zampini ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 8592fa34dd3eSStefano Zampini ierr = VecSet(pcbddc->coarse_vec,0.);CHKERRQ(ierr); 8593fa34dd3eSStefano Zampini ierr = 
VecScatterBegin(pcbddc->coarse_loc_to_glob,pcbddc->vec1_P,pcbddc->coarse_vec,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 8594fa34dd3eSStefano Zampini ierr = VecScatterEnd(pcbddc->coarse_loc_to_glob,pcbddc->vec1_P,pcbddc->coarse_vec,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 8595fa34dd3eSStefano Zampini ierr = VecScatterBegin(pcbddc->coarse_loc_to_glob,pcbddc->coarse_vec,pcbddc->vec1_P,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 8596fa34dd3eSStefano Zampini ierr = VecScatterEnd(pcbddc->coarse_loc_to_glob,pcbddc->coarse_vec,pcbddc->vec1_P,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 8597fa34dd3eSStefano Zampini ierr = VecGetArray(pcbddc->vec1_P,&array);CHKERRQ(ierr); 8598fa34dd3eSStefano Zampini /* scale primal nodes (BDDC sums contibutions) */ 8599fa34dd3eSStefano Zampini ierr = VecPointwiseMult(pcbddc->vec1_P,vec_scale_P,pcbddc->vec1_P);CHKERRQ(ierr); 8600fa34dd3eSStefano Zampini ierr = VecSetValues(pcis->vec1_N,pcbddc->local_primal_size,pcbddc->local_primal_ref_node,array,INSERT_VALUES);CHKERRQ(ierr); 8601fa34dd3eSStefano Zampini ierr = VecRestoreArray(pcbddc->vec1_P,&array);CHKERRQ(ierr); 8602fa34dd3eSStefano Zampini ierr = VecAssemblyBegin(pcis->vec1_N);CHKERRQ(ierr); 8603fa34dd3eSStefano Zampini ierr = VecAssemblyEnd(pcis->vec1_N);CHKERRQ(ierr); 8604fa34dd3eSStefano Zampini ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 8605fa34dd3eSStefano Zampini ierr = VecScatterEnd(pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 8606fa34dd3eSStefano Zampini /* global: \widetilde{B0}_B w_\Gamma */ 8607fa34dd3eSStefano Zampini if (zerodiag) { 8608fa34dd3eSStefano Zampini ierr = MatMult(B0_B,pcis->vec2_B,dummy_vec);CHKERRQ(ierr); 8609fa34dd3eSStefano Zampini ierr = VecGetArray(dummy_vec,&array);CHKERRQ(ierr); 86104f1b2e48SStefano Zampini for (i=0;i<pcbddc->benign_n;i++) pcbddc->benign_p0[i] = array[i]; 8611fa34dd3eSStefano Zampini ierr = 
VecRestoreArray(dummy_vec,&array);CHKERRQ(ierr); 8612fa34dd3eSStefano Zampini } 8613fa34dd3eSStefano Zampini /* BDDC */ 8614fa34dd3eSStefano Zampini ierr = VecSet(pcis->vec1_D,0.);CHKERRQ(ierr); 8615fa34dd3eSStefano Zampini ierr = PCBDDCApplyInterfacePreconditioner(pc,PETSC_FALSE);CHKERRQ(ierr); 8616fa34dd3eSStefano Zampini 8617fa34dd3eSStefano Zampini ierr = VecCopy(pcis->vec1_B,pcis->vec2_B);CHKERRQ(ierr); 8618fa34dd3eSStefano Zampini ierr = VecAXPY(pcis->vec1_B,-1.0,vec_check_B);CHKERRQ(ierr); 8619fa34dd3eSStefano Zampini ierr = VecNorm(pcis->vec1_B,NORM_INFINITY,&norm);CHKERRQ(ierr); 8620fa34dd3eSStefano Zampini PetscPrintf(PETSC_COMM_SELF,"[%d] BDDC local error is %1.4e\n",PetscGlobalRank,norm); 86214f1b2e48SStefano Zampini for (i=0;i<pcbddc->benign_n;i++) { 86224f1b2e48SStefano Zampini PetscPrintf(PETSC_COMM_SELF,"[%d] BDDC p0[%d] error is %1.4e\n",PetscGlobalRank,i,PetscAbsScalar(pcbddc->benign_p0[i]-p0_check[i])); 8623fa34dd3eSStefano Zampini } 86244f1b2e48SStefano Zampini ierr = PetscFree(p0_check);CHKERRQ(ierr); 8625fa34dd3eSStefano Zampini ierr = VecDestroy(&vec_scale_P);CHKERRQ(ierr); 8626fa34dd3eSStefano Zampini ierr = VecDestroy(&vec_check_B);CHKERRQ(ierr); 8627fa34dd3eSStefano Zampini ierr = VecDestroy(&dummy_vec);CHKERRQ(ierr); 8628fa34dd3eSStefano Zampini ierr = MatDestroy(&S_j);CHKERRQ(ierr); 8629fa34dd3eSStefano Zampini ierr = MatDestroy(&B0_B);CHKERRQ(ierr); 8630fa34dd3eSStefano Zampini } 8631fa34dd3eSStefano Zampini PetscFunctionReturn(0); 8632fa34dd3eSStefano Zampini } 86331e0482f5SStefano Zampini 86341e0482f5SStefano Zampini #include <../src/mat/impls/aij/mpi/mpiaij.h> 86351e0482f5SStefano Zampini PetscErrorCode MatMPIAIJRestrict(Mat A, MPI_Comm ccomm, Mat *B) 86361e0482f5SStefano Zampini { 86371e0482f5SStefano Zampini Mat At; 86381e0482f5SStefano Zampini IS rows; 86391e0482f5SStefano Zampini PetscInt rst,ren; 86401e0482f5SStefano Zampini PetscErrorCode ierr; 86411e0482f5SStefano Zampini PetscLayout rmap; 86421e0482f5SStefano Zampini 
86431e0482f5SStefano Zampini PetscFunctionBegin; 86441e0482f5SStefano Zampini rst = ren = 0; 86451e0482f5SStefano Zampini if (ccomm != MPI_COMM_NULL) { 86461e0482f5SStefano Zampini ierr = PetscLayoutCreate(ccomm,&rmap);CHKERRQ(ierr); 86471e0482f5SStefano Zampini ierr = PetscLayoutSetSize(rmap,A->rmap->N);CHKERRQ(ierr); 86481e0482f5SStefano Zampini ierr = PetscLayoutSetBlockSize(rmap,1);CHKERRQ(ierr); 86491e0482f5SStefano Zampini ierr = PetscLayoutSetUp(rmap);CHKERRQ(ierr); 86501e0482f5SStefano Zampini ierr = PetscLayoutGetRange(rmap,&rst,&ren);CHKERRQ(ierr); 86511e0482f5SStefano Zampini } 8652e07686f2SStefano Zampini ierr = ISCreateStride(PetscObjectComm((PetscObject)A),ren-rst,rst,1,&rows);CHKERRQ(ierr); 86537dae84e0SHong Zhang ierr = MatCreateSubMatrix(A,rows,NULL,MAT_INITIAL_MATRIX,&At);CHKERRQ(ierr); 86541e0482f5SStefano Zampini ierr = ISDestroy(&rows);CHKERRQ(ierr); 86551e0482f5SStefano Zampini 86561e0482f5SStefano Zampini if (ccomm != MPI_COMM_NULL) { 86571e0482f5SStefano Zampini Mat_MPIAIJ *a,*b; 86581e0482f5SStefano Zampini IS from,to; 86591e0482f5SStefano Zampini Vec gvec; 86601e0482f5SStefano Zampini PetscInt lsize; 86611e0482f5SStefano Zampini 86621e0482f5SStefano Zampini ierr = MatCreate(ccomm,B);CHKERRQ(ierr); 86631e0482f5SStefano Zampini ierr = MatSetSizes(*B,ren-rst,PETSC_DECIDE,PETSC_DECIDE,At->cmap->N);CHKERRQ(ierr); 86641e0482f5SStefano Zampini ierr = MatSetType(*B,MATAIJ);CHKERRQ(ierr); 86651e0482f5SStefano Zampini ierr = PetscLayoutDestroy(&((*B)->rmap));CHKERRQ(ierr); 86661e0482f5SStefano Zampini ierr = PetscLayoutSetUp((*B)->cmap);CHKERRQ(ierr); 86671e0482f5SStefano Zampini a = (Mat_MPIAIJ*)At->data; 86681e0482f5SStefano Zampini b = (Mat_MPIAIJ*)(*B)->data; 86691e0482f5SStefano Zampini ierr = MPI_Comm_size(ccomm,&b->size);CHKERRQ(ierr); 86701e0482f5SStefano Zampini ierr = MPI_Comm_rank(ccomm,&b->rank);CHKERRQ(ierr); 86711e0482f5SStefano Zampini ierr = PetscObjectReference((PetscObject)a->A);CHKERRQ(ierr); 86721e0482f5SStefano Zampini ierr = 
PetscObjectReference((PetscObject)a->B);CHKERRQ(ierr); 86731e0482f5SStefano Zampini b->A = a->A; 86741e0482f5SStefano Zampini b->B = a->B; 86751e0482f5SStefano Zampini 86761e0482f5SStefano Zampini b->donotstash = a->donotstash; 86771e0482f5SStefano Zampini b->roworiented = a->roworiented; 86781e0482f5SStefano Zampini b->rowindices = 0; 86791e0482f5SStefano Zampini b->rowvalues = 0; 86801e0482f5SStefano Zampini b->getrowactive = PETSC_FALSE; 86811e0482f5SStefano Zampini 86821e0482f5SStefano Zampini (*B)->rmap = rmap; 86831e0482f5SStefano Zampini (*B)->factortype = A->factortype; 86841e0482f5SStefano Zampini (*B)->assembled = PETSC_TRUE; 86851e0482f5SStefano Zampini (*B)->insertmode = NOT_SET_VALUES; 86861e0482f5SStefano Zampini (*B)->preallocated = PETSC_TRUE; 86871e0482f5SStefano Zampini 86881e0482f5SStefano Zampini if (a->colmap) { 86891e0482f5SStefano Zampini #if defined(PETSC_USE_CTABLE) 86901e0482f5SStefano Zampini ierr = PetscTableCreateCopy(a->colmap,&b->colmap);CHKERRQ(ierr); 86911e0482f5SStefano Zampini #else 86921e0482f5SStefano Zampini ierr = PetscMalloc1(At->cmap->N,&b->colmap);CHKERRQ(ierr); 86931e0482f5SStefano Zampini ierr = PetscLogObjectMemory((PetscObject)*B,At->cmap->N*sizeof(PetscInt));CHKERRQ(ierr); 86941e0482f5SStefano Zampini ierr = PetscMemcpy(b->colmap,a->colmap,At->cmap->N*sizeof(PetscInt));CHKERRQ(ierr); 86951e0482f5SStefano Zampini #endif 86961e0482f5SStefano Zampini } else b->colmap = 0; 86971e0482f5SStefano Zampini if (a->garray) { 86981e0482f5SStefano Zampini PetscInt len; 86991e0482f5SStefano Zampini len = a->B->cmap->n; 87001e0482f5SStefano Zampini ierr = PetscMalloc1(len+1,&b->garray);CHKERRQ(ierr); 87011e0482f5SStefano Zampini ierr = PetscLogObjectMemory((PetscObject)(*B),len*sizeof(PetscInt));CHKERRQ(ierr); 87021e0482f5SStefano Zampini if (len) { ierr = PetscMemcpy(b->garray,a->garray,len*sizeof(PetscInt));CHKERRQ(ierr); } 87031e0482f5SStefano Zampini } else b->garray = 0; 87041e0482f5SStefano Zampini 87051e0482f5SStefano Zampini 
ierr = PetscObjectReference((PetscObject)a->lvec);CHKERRQ(ierr); 87061e0482f5SStefano Zampini b->lvec = a->lvec; 87071e0482f5SStefano Zampini ierr = PetscLogObjectParent((PetscObject)*B,(PetscObject)b->lvec);CHKERRQ(ierr); 87081e0482f5SStefano Zampini 87091e0482f5SStefano Zampini /* cannot use VecScatterCopy */ 87101e0482f5SStefano Zampini ierr = VecGetLocalSize(b->lvec,&lsize);CHKERRQ(ierr); 87111e0482f5SStefano Zampini ierr = ISCreateGeneral(ccomm,lsize,b->garray,PETSC_USE_POINTER,&from);CHKERRQ(ierr); 87121e0482f5SStefano Zampini ierr = ISCreateStride(PETSC_COMM_SELF,lsize,0,1,&to);CHKERRQ(ierr); 87131e0482f5SStefano Zampini ierr = MatCreateVecs(*B,&gvec,NULL);CHKERRQ(ierr); 87141e0482f5SStefano Zampini ierr = VecScatterCreate(gvec,from,b->lvec,to,&b->Mvctx);CHKERRQ(ierr); 87151e0482f5SStefano Zampini ierr = PetscLogObjectParent((PetscObject)*B,(PetscObject)b->Mvctx);CHKERRQ(ierr); 87161e0482f5SStefano Zampini ierr = ISDestroy(&from);CHKERRQ(ierr); 87171e0482f5SStefano Zampini ierr = ISDestroy(&to);CHKERRQ(ierr); 87181e0482f5SStefano Zampini ierr = VecDestroy(&gvec);CHKERRQ(ierr); 87191e0482f5SStefano Zampini } 87201e0482f5SStefano Zampini ierr = MatDestroy(&At);CHKERRQ(ierr); 87211e0482f5SStefano Zampini PetscFunctionReturn(0); 87221e0482f5SStefano Zampini } 8723