1ab5c6b0cSJed Brown #include <../src/ksp/pc/impls/bddc/bddc.h> 2ab5c6b0cSJed Brown #include <../src/ksp/pc/impls/bddc/bddcprivate.h> 3*25d06dbeSstefano_zampini #include <petscblaslapack.h> 4*25d06dbeSstefano_zampini 5*25d06dbeSstefano_zampini #undef __FUNCT__ 6*25d06dbeSstefano_zampini #define __FUNCT__ "MatMult_BDdelta_deluxe_nonred" 7*25d06dbeSstefano_zampini static PetscErrorCode MatMult_BDdelta_deluxe_nonred(Mat A, Vec x, Vec y) 8*25d06dbeSstefano_zampini { 9*25d06dbeSstefano_zampini BDdelta_DN ctx; 10*25d06dbeSstefano_zampini PetscErrorCode ierr; 11*25d06dbeSstefano_zampini 12*25d06dbeSstefano_zampini PetscFunctionBegin; 13*25d06dbeSstefano_zampini ierr = MatShellGetContext(A,(void**)&ctx);CHKERRQ(ierr); 14*25d06dbeSstefano_zampini ierr = MatMultTranspose(ctx->BD,x,ctx->work);CHKERRQ(ierr); 15*25d06dbeSstefano_zampini ierr = KSPSolveTranspose(ctx->kBD,ctx->work,y);CHKERRQ(ierr); 16*25d06dbeSstefano_zampini PetscFunctionReturn(0); 17*25d06dbeSstefano_zampini } 18*25d06dbeSstefano_zampini 19*25d06dbeSstefano_zampini #undef __FUNCT__ 20*25d06dbeSstefano_zampini #define __FUNCT__ "MatMultTranspose_BDdelta_deluxe_nonred" 21*25d06dbeSstefano_zampini static PetscErrorCode MatMultTranspose_BDdelta_deluxe_nonred(Mat A, Vec x, Vec y) 22*25d06dbeSstefano_zampini { 23*25d06dbeSstefano_zampini BDdelta_DN ctx; 24*25d06dbeSstefano_zampini PetscErrorCode ierr; 25*25d06dbeSstefano_zampini 26*25d06dbeSstefano_zampini PetscFunctionBegin; 27*25d06dbeSstefano_zampini ierr = MatShellGetContext(A,(void**)&ctx);CHKERRQ(ierr); 28*25d06dbeSstefano_zampini ierr = KSPSolve(ctx->kBD,x,ctx->work);CHKERRQ(ierr); 29*25d06dbeSstefano_zampini ierr = MatMult(ctx->BD,ctx->work,y);CHKERRQ(ierr); 30*25d06dbeSstefano_zampini PetscFunctionReturn(0); 31*25d06dbeSstefano_zampini } 32*25d06dbeSstefano_zampini 33*25d06dbeSstefano_zampini #undef __FUNCT__ 34*25d06dbeSstefano_zampini #define __FUNCT__ "MatDestroy_BDdelta_deluxe_nonred" 35*25d06dbeSstefano_zampini static PetscErrorCode MatDestroy_BDdelta_deluxe_nonred(Mat A) 36*25d06dbeSstefano_zampini { 37*25d06dbeSstefano_zampini BDdelta_DN ctx; 38*25d06dbeSstefano_zampini PetscErrorCode ierr; 39*25d06dbeSstefano_zampini 40*25d06dbeSstefano_zampini PetscFunctionBegin; 41*25d06dbeSstefano_zampini ierr = MatShellGetContext(A,(void**)&ctx);CHKERRQ(ierr); 42*25d06dbeSstefano_zampini ierr = MatDestroy(&ctx->BD);CHKERRQ(ierr); 43*25d06dbeSstefano_zampini ierr = KSPDestroy(&ctx->kBD);CHKERRQ(ierr); 44*25d06dbeSstefano_zampini ierr = VecDestroy(&ctx->work);CHKERRQ(ierr); 45*25d06dbeSstefano_zampini ierr = PetscFree(ctx);CHKERRQ(ierr); 46*25d06dbeSstefano_zampini PetscFunctionReturn(0); 47*25d06dbeSstefano_zampini } 48*25d06dbeSstefano_zampini 49674ae819SStefano Zampini 50674ae819SStefano Zampini #undef __FUNCT__ 51674ae819SStefano Zampini #define __FUNCT__ "PCBDDCCreateFETIDPMatContext" 52674ae819SStefano Zampini PetscErrorCode PCBDDCCreateFETIDPMatContext(PC pc, FETIDPMat_ctx *fetidpmat_ctx) 53674ae819SStefano Zampini { 54674ae819SStefano Zampini FETIDPMat_ctx newctx; 55674ae819SStefano Zampini PetscErrorCode ierr; 56674ae819SStefano Zampini 57674ae819SStefano Zampini PetscFunctionBegin; 58854ce69bSBarry Smith ierr = PetscNew(&newctx);CHKERRQ(ierr); 59674ae819SStefano Zampini /* increase the reference count for BDDC preconditioner */ 60674ae819SStefano Zampini ierr = PetscObjectReference((PetscObject)pc);CHKERRQ(ierr); 61674ae819SStefano Zampini newctx->pc = pc; 62674ae819SStefano Zampini *fetidpmat_ctx = newctx; 63674ae819SStefano Zampini PetscFunctionReturn(0); 64674ae819SStefano Zampini } 65674ae819SStefano Zampini 66674ae819SStefano Zampini #undef __FUNCT__ 67674ae819SStefano Zampini #define __FUNCT__ "PCBDDCCreateFETIDPPCContext" 68674ae819SStefano Zampini PetscErrorCode PCBDDCCreateFETIDPPCContext(PC pc, FETIDPPC_ctx *fetidppc_ctx) 69674ae819SStefano Zampini { 70674ae819SStefano Zampini FETIDPPC_ctx newctx; 71674ae819SStefano Zampini PetscErrorCode ierr; 72674ae819SStefano Zampini 73674ae819SStefano Zampini PetscFunctionBegin; 74854ce69bSBarry Smith ierr = PetscNew(&newctx);CHKERRQ(ierr); 75674ae819SStefano Zampini /* increase the reference count for BDDC preconditioner */ 76674ae819SStefano Zampini ierr = PetscObjectReference((PetscObject)pc);CHKERRQ(ierr); 77674ae819SStefano Zampini newctx->pc = pc; 78674ae819SStefano Zampini *fetidppc_ctx = newctx; 79674ae819SStefano Zampini PetscFunctionReturn(0); 80674ae819SStefano Zampini } 81674ae819SStefano Zampini 82674ae819SStefano Zampini #undef __FUNCT__ 83674ae819SStefano Zampini #define __FUNCT__ "PCBDDCDestroyFETIDPMat" 84674ae819SStefano Zampini PetscErrorCode PCBDDCDestroyFETIDPMat(Mat A) 85674ae819SStefano Zampini { 86674ae819SStefano Zampini FETIDPMat_ctx mat_ctx; 87674ae819SStefano Zampini PetscErrorCode ierr; 88674ae819SStefano Zampini 89674ae819SStefano Zampini PetscFunctionBegin; 90674ae819SStefano Zampini ierr = MatShellGetContext(A,(void**)&mat_ctx);CHKERRQ(ierr); 91674ae819SStefano Zampini ierr = VecDestroy(&mat_ctx->lambda_local);CHKERRQ(ierr); 92674ae819SStefano Zampini ierr = VecDestroy(&mat_ctx->temp_solution_D);CHKERRQ(ierr); 93674ae819SStefano Zampini ierr = VecDestroy(&mat_ctx->temp_solution_B);CHKERRQ(ierr); 94674ae819SStefano Zampini ierr = MatDestroy(&mat_ctx->B_delta);CHKERRQ(ierr); 95674ae819SStefano Zampini ierr = MatDestroy(&mat_ctx->B_Ddelta);CHKERRQ(ierr); 96457d4a33Sstefano_zampini ierr = MatDestroy(&mat_ctx->B_BB);CHKERRQ(ierr); 97457d4a33Sstefano_zampini ierr = MatDestroy(&mat_ctx->B_BI);CHKERRQ(ierr); 98457d4a33Sstefano_zampini ierr = MatDestroy(&mat_ctx->Bt_BB);CHKERRQ(ierr); 99457d4a33Sstefano_zampini ierr = MatDestroy(&mat_ctx->Bt_BI);CHKERRQ(ierr); 100457d4a33Sstefano_zampini ierr = MatDestroy(&mat_ctx->C);CHKERRQ(ierr); 1016cc1294bSstefano_zampini ierr = VecDestroy(&mat_ctx->rhs_flip);CHKERRQ(ierr); 102457d4a33Sstefano_zampini ierr = VecDestroy(&mat_ctx->vP);CHKERRQ(ierr); 103457d4a33Sstefano_zampini ierr = VecDestroy(&mat_ctx->xPg);CHKERRQ(ierr); 104457d4a33Sstefano_zampini ierr = VecDestroy(&mat_ctx->yPg);CHKERRQ(ierr); 105674ae819SStefano Zampini ierr = VecScatterDestroy(&mat_ctx->l2g_lambda);CHKERRQ(ierr); 106457d4a33Sstefano_zampini ierr = VecScatterDestroy(&mat_ctx->l2g_p);CHKERRQ(ierr); 1079cc7774eSstefano_zampini ierr = VecScatterDestroy(&mat_ctx->g2g_p);CHKERRQ(ierr); 108674ae819SStefano Zampini ierr = PCDestroy(&mat_ctx->pc);CHKERRQ(ierr); /* decrease PCBDDC reference count */ 109674ae819SStefano Zampini ierr = PetscFree(mat_ctx);CHKERRQ(ierr); 110674ae819SStefano Zampini PetscFunctionReturn(0); 111674ae819SStefano Zampini } 112674ae819SStefano Zampini 113674ae819SStefano Zampini #undef __FUNCT__ 114674ae819SStefano Zampini #define __FUNCT__ "PCBDDCDestroyFETIDPPC" 115674ae819SStefano Zampini PetscErrorCode PCBDDCDestroyFETIDPPC(PC pc) 116674ae819SStefano Zampini { 117674ae819SStefano Zampini FETIDPPC_ctx pc_ctx; 118674ae819SStefano Zampini PetscErrorCode ierr; 119674ae819SStefano Zampini 120674ae819SStefano Zampini PetscFunctionBegin; 121674ae819SStefano Zampini ierr = PCShellGetContext(pc,(void**)&pc_ctx);CHKERRQ(ierr); 122674ae819SStefano Zampini ierr = VecDestroy(&pc_ctx->lambda_local);CHKERRQ(ierr); 123674ae819SStefano Zampini ierr = MatDestroy(&pc_ctx->B_Ddelta);CHKERRQ(ierr); 124674ae819SStefano Zampini ierr = VecScatterDestroy(&pc_ctx->l2g_lambda);CHKERRQ(ierr); 12568668abeSStefano Zampini ierr = MatDestroy(&pc_ctx->S_j);CHKERRQ(ierr); 126674ae819SStefano Zampini ierr = PCDestroy(&pc_ctx->pc);CHKERRQ(ierr); /* decrease PCBDDC reference count */ 127457d4a33Sstefano_zampini ierr = KSPDestroy(&pc_ctx->kP);CHKERRQ(ierr); 128457d4a33Sstefano_zampini ierr = VecDestroy(&pc_ctx->xPg);CHKERRQ(ierr); 129457d4a33Sstefano_zampini ierr = VecDestroy(&pc_ctx->yPg);CHKERRQ(ierr); 130674ae819SStefano Zampini ierr = PetscFree(pc_ctx);CHKERRQ(ierr); 131674ae819SStefano Zampini PetscFunctionReturn(0); 132674ae819SStefano Zampini } 133674ae819SStefano Zampini 134674ae819SStefano Zampini #undef __FUNCT__ 135674ae819SStefano Zampini #define __FUNCT__ "PCBDDCSetupFETIDPMatContext" 136674ae819SStefano Zampini PetscErrorCode PCBDDCSetupFETIDPMatContext(FETIDPMat_ctx fetidpmat_ctx ) 137674ae819SStefano Zampini { 138674ae819SStefano Zampini PetscErrorCode ierr; 139674ae819SStefano Zampini PC_IS *pcis=(PC_IS*)fetidpmat_ctx->pc->data; 140674ae819SStefano Zampini PC_BDDC *pcbddc=(PC_BDDC*)fetidpmat_ctx->pc->data; 141674ae819SStefano Zampini PCBDDCGraph mat_graph=pcbddc->mat_graph; 142674ae819SStefano Zampini Mat_IS *matis = (Mat_IS*)fetidpmat_ctx->pc->pmat->data; 143674ae819SStefano Zampini MPI_Comm comm; 144*25d06dbeSstefano_zampini Mat ScalingMat,BD1,BD2; 145457d4a33Sstefano_zampini Vec fetidp_global; 146674ae819SStefano Zampini IS IS_l2g_lambda; 147a1c0d0daSstefano_zampini IS subset,subset_mult,subset_n,isvert; 148674ae819SStefano Zampini PetscBool skip_node,fully_redundant; 149674ae819SStefano Zampini PetscInt i,j,k,s,n_boundary_dofs,n_global_lambda,n_vertices,partial_sum; 150dc456d91SStefano Zampini PetscInt cum,n_local_lambda,n_lambda_for_dof,dual_size,n_neg_values,n_pos_values; 15176ec1555SBarry Smith PetscMPIInt rank,size,buf_size,neigh; 152674ae819SStefano Zampini PetscScalar scalar_value; 153a1c0d0daSstefano_zampini const PetscInt *vertex_indices; 154dc456d91SStefano Zampini PetscInt *dual_dofs_boundary_indices,*aux_local_numbering_1; 155dc456d91SStefano Zampini const PetscInt *aux_global_numbering; 156674ae819SStefano Zampini PetscInt *aux_sums,*cols_B_delta,*l2g_indices; 157674ae819SStefano Zampini PetscScalar *array,*scaling_factors,*vals_B_delta; 158*25d06dbeSstefano_zampini PetscScalar **all_factors; 159674ae819SStefano Zampini PetscInt *aux_local_numbering_2; 160457d4a33Sstefano_zampini PetscLayout llay; 161a1c0d0daSstefano_zampini 162457d4a33Sstefano_zampini /* saddlepoint */ 163457d4a33Sstefano_zampini ISLocalToGlobalMapping l2gmap_p; 164457d4a33Sstefano_zampini PetscLayout play; 165457d4a33Sstefano_zampini IS gP,pP; 166457d4a33Sstefano_zampini PetscInt nPl,nPg,nPgl; 167674ae819SStefano Zampini 168674ae819SStefano Zampini PetscFunctionBegin; 169674ae819SStefano Zampini ierr = PetscObjectGetComm((PetscObject)(fetidpmat_ctx->pc),&comm);CHKERRQ(ierr); 170674ae819SStefano Zampini ierr = MPI_Comm_rank(comm,&rank);CHKERRQ(ierr); 17176ec1555SBarry Smith ierr = MPI_Comm_size(comm,&size);CHKERRQ(ierr); 172674ae819SStefano Zampini 173457d4a33Sstefano_zampini /* saddlepoint */ 174457d4a33Sstefano_zampini nPl = 0; 175457d4a33Sstefano_zampini nPg = 0; 176457d4a33Sstefano_zampini nPgl = 0; 177457d4a33Sstefano_zampini gP = NULL; 178457d4a33Sstefano_zampini pP = NULL; 179457d4a33Sstefano_zampini l2gmap_p = NULL; 180457d4a33Sstefano_zampini play = NULL; 181457d4a33Sstefano_zampini ierr = PetscObjectQuery((PetscObject)fetidpmat_ctx->pc,"__KSPFETIDP_pP",(PetscObject*)&pP);CHKERRQ(ierr); 182022d8d2bSstefano_zampini if (pP) { /* saddle point */ 183457d4a33Sstefano_zampini /* subdomain pressures in global numbering */ 184457d4a33Sstefano_zampini ierr = PetscObjectQuery((PetscObject)fetidpmat_ctx->pc,"__KSPFETIDP_gP",(PetscObject*)&gP);CHKERRQ(ierr); 185457d4a33Sstefano_zampini if (!gP) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"gP not present"); 186457d4a33Sstefano_zampini ierr = ISGetLocalSize(gP,&nPl);CHKERRQ(ierr); 187457d4a33Sstefano_zampini ierr = VecCreate(PETSC_COMM_SELF,&fetidpmat_ctx->vP);CHKERRQ(ierr); 188457d4a33Sstefano_zampini ierr = VecSetSizes(fetidpmat_ctx->vP,nPl,nPl);CHKERRQ(ierr); 189457d4a33Sstefano_zampini ierr = VecSetType(fetidpmat_ctx->vP,VECSTANDARD);CHKERRQ(ierr); 190457d4a33Sstefano_zampini ierr = VecSetUp(fetidpmat_ctx->vP);CHKERRQ(ierr); 191457d4a33Sstefano_zampini 192457d4a33Sstefano_zampini /* interface pressure matrix */ 193457d4a33Sstefano_zampini ierr = PetscObjectQuery((PetscObject)fetidpmat_ctx->pc,"__KSPFETIDP_C",(PetscObject*)&fetidpmat_ctx->C);CHKERRQ(ierr); 194457d4a33Sstefano_zampini if (!fetidpmat_ctx->C) { /* null pressure block, compute layout and global numbering for interface pressures */ 195457d4a33Sstefano_zampini IS Pg; 196457d4a33Sstefano_zampini 197457d4a33Sstefano_zampini ierr = ISRenumber(gP,NULL,&nPg,&Pg);CHKERRQ(ierr); 198457d4a33Sstefano_zampini ierr = ISLocalToGlobalMappingCreateIS(Pg,&l2gmap_p);CHKERRQ(ierr); 199457d4a33Sstefano_zampini ierr = ISDestroy(&Pg);CHKERRQ(ierr); 200457d4a33Sstefano_zampini ierr = PetscLayoutCreate(comm,&play);CHKERRQ(ierr); 201457d4a33Sstefano_zampini ierr = PetscLayoutSetBlockSize(play,1);CHKERRQ(ierr); 202457d4a33Sstefano_zampini ierr = PetscLayoutSetSize(play,nPg);CHKERRQ(ierr); 203457d4a33Sstefano_zampini ierr = ISGetLocalSize(pP,&nPgl);CHKERRQ(ierr); 204457d4a33Sstefano_zampini ierr = PetscLayoutSetLocalSize(play,nPgl);CHKERRQ(ierr); 205457d4a33Sstefano_zampini ierr = PetscLayoutSetUp(play);CHKERRQ(ierr); 206457d4a33Sstefano_zampini } else { 207457d4a33Sstefano_zampini ierr = PetscObjectReference((PetscObject)fetidpmat_ctx->C);CHKERRQ(ierr); 208457d4a33Sstefano_zampini ierr = MatGetLocalToGlobalMapping(fetidpmat_ctx->C,&l2gmap_p,NULL);CHKERRQ(ierr); 209457d4a33Sstefano_zampini ierr = PetscObjectReference((PetscObject)l2gmap_p);CHKERRQ(ierr); 210457d4a33Sstefano_zampini ierr = MatGetSize(fetidpmat_ctx->C,&nPg,NULL);CHKERRQ(ierr); 211457d4a33Sstefano_zampini ierr = MatGetLocalSize(fetidpmat_ctx->C,NULL,&nPgl);CHKERRQ(ierr); 212457d4a33Sstefano_zampini ierr = MatGetLayouts(fetidpmat_ctx->C,NULL,&llay);CHKERRQ(ierr); 213457d4a33Sstefano_zampini ierr = PetscLayoutReference(llay,&play);CHKERRQ(ierr); 214457d4a33Sstefano_zampini } 215457d4a33Sstefano_zampini ierr = VecCreateMPIWithArray(comm,1,nPgl,nPg,NULL,&fetidpmat_ctx->xPg);CHKERRQ(ierr); 216457d4a33Sstefano_zampini ierr = VecCreateMPIWithArray(comm,1,nPgl,nPg,NULL,&fetidpmat_ctx->yPg);CHKERRQ(ierr); 217457d4a33Sstefano_zampini 218457d4a33Sstefano_zampini /* import matrices for interface pressures coupling */ 219457d4a33Sstefano_zampini ierr = PetscObjectQuery((PetscObject)fetidpmat_ctx->pc,"__KSPFETIDP_B_BI",(PetscObject*)&fetidpmat_ctx->B_BI);CHKERRQ(ierr); 220457d4a33Sstefano_zampini if (!fetidpmat_ctx->B_BI) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"B_BI not present"); 221457d4a33Sstefano_zampini ierr = PetscObjectReference((PetscObject)fetidpmat_ctx->B_BI);CHKERRQ(ierr); 222457d4a33Sstefano_zampini 223457d4a33Sstefano_zampini ierr = PetscObjectQuery((PetscObject)fetidpmat_ctx->pc,"__KSPFETIDP_B_BB",(PetscObject*)&fetidpmat_ctx->B_BB);CHKERRQ(ierr); 224457d4a33Sstefano_zampini if (!fetidpmat_ctx->B_BB) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"B_BB not present"); 225457d4a33Sstefano_zampini ierr = PetscObjectReference((PetscObject)fetidpmat_ctx->B_BB);CHKERRQ(ierr); 226457d4a33Sstefano_zampini 227457d4a33Sstefano_zampini ierr = PetscObjectQuery((PetscObject)fetidpmat_ctx->pc,"__KSPFETIDP_Bt_BI",(PetscObject*)&fetidpmat_ctx->Bt_BI);CHKERRQ(ierr); 228457d4a33Sstefano_zampini if (!fetidpmat_ctx->Bt_BI) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Bt_BI not present"); 229457d4a33Sstefano_zampini ierr = PetscObjectReference((PetscObject)fetidpmat_ctx->Bt_BI);CHKERRQ(ierr); 230457d4a33Sstefano_zampini 231457d4a33Sstefano_zampini ierr = PetscObjectQuery((PetscObject)fetidpmat_ctx->pc,"__KSPFETIDP_Bt_BB",(PetscObject*)&fetidpmat_ctx->Bt_BB);CHKERRQ(ierr); 232457d4a33Sstefano_zampini if (!fetidpmat_ctx->Bt_BB) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Bt_BB not present"); 233457d4a33Sstefano_zampini ierr = PetscObjectReference((PetscObject)fetidpmat_ctx->Bt_BB);CHKERRQ(ierr); 2346cc1294bSstefano_zampini 2356cc1294bSstefano_zampini ierr = PetscObjectQuery((PetscObject)fetidpmat_ctx->pc,"__KSPFETIDP_flip" ,(PetscObject*)&fetidpmat_ctx->rhs_flip);CHKERRQ(ierr); 2366cc1294bSstefano_zampini if (fetidpmat_ctx->rhs_flip) { 2376cc1294bSstefano_zampini ierr = PetscObjectReference((PetscObject)fetidpmat_ctx->rhs_flip);CHKERRQ(ierr); 2386cc1294bSstefano_zampini } 239457d4a33Sstefano_zampini } 240457d4a33Sstefano_zampini 241674ae819SStefano Zampini /* Default type of lagrange multipliers is non-redundant */ 242329cd39dSStefano Zampini fully_redundant = fetidpmat_ctx->fully_redundant; 243674ae819SStefano Zampini 244674ae819SStefano Zampini /* Evaluate local and global number of lagrange multipliers */ 245674ae819SStefano Zampini ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr); 246674ae819SStefano Zampini n_local_lambda = 0; 247674ae819SStefano Zampini partial_sum = 0; 248674ae819SStefano Zampini n_boundary_dofs = 0; 249674ae819SStefano Zampini s = 0; 250a1c0d0daSstefano_zampini 251674ae819SStefano Zampini /* Get Vertices used to define the BDDC */ 252a1c0d0daSstefano_zampini ierr = PCBDDCGraphGetCandidatesIS(pcbddc->mat_graph,NULL,NULL,NULL,NULL,&isvert);CHKERRQ(ierr); 253a1c0d0daSstefano_zampini ierr = ISGetLocalSize(isvert,&n_vertices);CHKERRQ(ierr); 254a1c0d0daSstefano_zampini ierr = ISGetIndices(isvert,&vertex_indices);CHKERRQ(ierr); 255a1c0d0daSstefano_zampini 256674ae819SStefano Zampini dual_size = pcis->n_B-n_vertices; 257785e854fSJed Brown ierr = PetscMalloc1(dual_size,&dual_dofs_boundary_indices);CHKERRQ(ierr); 258785e854fSJed Brown ierr = PetscMalloc1(dual_size,&aux_local_numbering_1);CHKERRQ(ierr); 259785e854fSJed Brown ierr = PetscMalloc1(dual_size,&aux_local_numbering_2);CHKERRQ(ierr); 260674ae819SStefano Zampini 261674ae819SStefano Zampini ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 262674ae819SStefano Zampini for (i=0;i<pcis->n;i++){ 263674ae819SStefano Zampini j = mat_graph->count[i]; /* RECALL: mat_graph->count[i] does not count myself */ 2642d456bbaSstefano_zampini if (j > 0) n_boundary_dofs++; 265674ae819SStefano Zampini skip_node = PETSC_FALSE; 266674ae819SStefano Zampini if (s < n_vertices && vertex_indices[s] == i) { /* it works for a sorted set of vertices */ 267674ae819SStefano Zampini skip_node = PETSC_TRUE; 268674ae819SStefano Zampini s++; 269674ae819SStefano Zampini } 2702d456bbaSstefano_zampini if (j < 1) skip_node = PETSC_TRUE; 2712d456bbaSstefano_zampini if (mat_graph->special_dof[i] == PCBDDCGRAPH_DIRICHLET_MARK) skip_node = PETSC_TRUE; 272674ae819SStefano Zampini if (!skip_node) { 273674ae819SStefano Zampini if (fully_redundant) { 274674ae819SStefano Zampini /* fully redundant set of lagrange multipliers */ 275674ae819SStefano Zampini n_lambda_for_dof = (j*(j+1))/2; 276674ae819SStefano Zampini } else { 277674ae819SStefano Zampini n_lambda_for_dof = j; 278674ae819SStefano Zampini } 279674ae819SStefano Zampini n_local_lambda += j; 280674ae819SStefano Zampini /* needed to evaluate global number of lagrange multipliers */ 281674ae819SStefano Zampini array[i]=(1.0*n_lambda_for_dof)/(j+1.0); /* already scaled for the next global sum */ 282674ae819SStefano Zampini /* store some data needed */ 283674ae819SStefano Zampini dual_dofs_boundary_indices[partial_sum] = n_boundary_dofs-1; 284674ae819SStefano Zampini aux_local_numbering_1[partial_sum] = i; 285674ae819SStefano Zampini aux_local_numbering_2[partial_sum] = n_lambda_for_dof; 286674ae819SStefano Zampini partial_sum++; 287674ae819SStefano Zampini } 288674ae819SStefano Zampini } 289674ae819SStefano Zampini ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 290a1c0d0daSstefano_zampini ierr = ISRestoreIndices(isvert,&vertex_indices);CHKERRQ(ierr); 291a1c0d0daSstefano_zampini ierr = PCBDDCGraphRestoreCandidatesIS(pcbddc->mat_graph,NULL,NULL,NULL,NULL,&isvert);CHKERRQ(ierr); 2922d456bbaSstefano_zampini dual_size = partial_sum; 293674ae819SStefano Zampini 294674ae819SStefano Zampini /* compute global ordering of lagrange multipliers and associate l2g map */ 295dc456d91SStefano Zampini ierr = ISCreateGeneral(comm,partial_sum,aux_local_numbering_1,PETSC_COPY_VALUES,&subset_n);CHKERRQ(ierr); 2963bbff08aSStefano Zampini ierr = ISLocalToGlobalMappingApplyIS(pcis->mapping,subset_n,&subset);CHKERRQ(ierr); 297dc456d91SStefano Zampini ierr = ISDestroy(&subset_n);CHKERRQ(ierr); 298dc456d91SStefano Zampini ierr = ISCreateGeneral(comm,partial_sum,aux_local_numbering_2,PETSC_OWN_POINTER,&subset_mult);CHKERRQ(ierr); 2993d996552SStefano Zampini ierr = ISRenumber(subset,subset_mult,&fetidpmat_ctx->n_lambda,&subset_n);CHKERRQ(ierr); 300dc456d91SStefano Zampini ierr = ISDestroy(&subset);CHKERRQ(ierr); 3013d996552SStefano Zampini 3024fe826edSStefano Zampini #if defined(PETSC_USE_DEBUG) 3034fe826edSStefano Zampini ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr); 3044fe826edSStefano Zampini ierr = VecScatterBegin(matis->rctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 3054fe826edSStefano Zampini ierr = VecScatterEnd(matis->rctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 3064fe826edSStefano Zampini ierr = VecSum(pcis->vec1_global,&scalar_value);CHKERRQ(ierr); 3074fe826edSStefano Zampini i = (PetscInt)PetscRealPart(scalar_value); 3086c4ed002SBarry Smith if (i != fetidpmat_ctx->n_lambda) SETERRQ2(PETSC_COMM_WORLD,PETSC_ERR_PLIB,"Global number of multipliers mismatch! (%d!=%d)\n",fetidpmat_ctx->n_lambda,i); 3094fe826edSStefano Zampini #endif 310674ae819SStefano Zampini 311674ae819SStefano Zampini /* init data for scaling factors exchange */ 312*25d06dbeSstefano_zampini if (!pcbddc->use_deluxe_scaling) { 313*25d06dbeSstefano_zampini PetscInt *ptrs_buffer,neigh_position; 314*25d06dbeSstefano_zampini PetscScalar *send_buffer,*recv_buffer; 315*25d06dbeSstefano_zampini MPI_Request *send_reqs,*recv_reqs; 316*25d06dbeSstefano_zampini 317674ae819SStefano Zampini partial_sum = 0; 318785e854fSJed Brown ierr = PetscMalloc1(pcis->n_neigh,&ptrs_buffer);CHKERRQ(ierr); 3194b2aedd3SStefano Zampini ierr = PetscMalloc1(PetscMax(pcis->n_neigh-1,0),&send_reqs);CHKERRQ(ierr); 3204b2aedd3SStefano Zampini ierr = PetscMalloc1(PetscMax(pcis->n_neigh-1,0),&recv_reqs);CHKERRQ(ierr); 32119c16490Sstefano_zampini ierr = PetscMalloc1(pcis->n+1,&all_factors);CHKERRQ(ierr); 3224b2aedd3SStefano Zampini if (pcis->n_neigh > 0) ptrs_buffer[0]=0; 323674ae819SStefano Zampini for (i=1;i<pcis->n_neigh;i++) { 324674ae819SStefano Zampini partial_sum += pcis->n_shared[i]; 325674ae819SStefano Zampini ptrs_buffer[i] = ptrs_buffer[i-1]+pcis->n_shared[i]; 326674ae819SStefano Zampini } 327785e854fSJed Brown ierr = PetscMalloc1(partial_sum,&send_buffer);CHKERRQ(ierr); 328785e854fSJed Brown ierr = PetscMalloc1(partial_sum,&recv_buffer);CHKERRQ(ierr); 329785e854fSJed Brown ierr = PetscMalloc1(partial_sum,&all_factors[0]);CHKERRQ(ierr); 330674ae819SStefano Zampini for (i=0;i<pcis->n-1;i++) { 331674ae819SStefano Zampini j = mat_graph->count[i]; 332674ae819SStefano Zampini all_factors[i+1]=all_factors[i]+j; 333674ae819SStefano Zampini } 334*25d06dbeSstefano_zampini 335674ae819SStefano Zampini /* scatter B scaling to N vec */ 336674ae819SStefano Zampini ierr = VecScatterBegin(pcis->N_to_B,pcis->D,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 337674ae819SStefano Zampini ierr = VecScatterEnd(pcis->N_to_B,pcis->D,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 338674ae819SStefano Zampini /* communications */ 3392b095fd8SStefano Zampini ierr = VecGetArrayRead(pcis->vec1_N,(const PetscScalar**)&array);CHKERRQ(ierr); 340674ae819SStefano Zampini for (i=1;i<pcis->n_neigh;i++) { 341674ae819SStefano Zampini for (j=0;j<pcis->n_shared[i];j++) { 342674ae819SStefano Zampini send_buffer[ptrs_buffer[i-1]+j]=array[pcis->shared[i][j]]; 343674ae819SStefano Zampini } 344674ae819SStefano Zampini ierr = PetscMPIIntCast(ptrs_buffer[i]-ptrs_buffer[i-1],&buf_size);CHKERRQ(ierr); 345674ae819SStefano Zampini ierr = PetscMPIIntCast(pcis->neigh[i],&neigh);CHKERRQ(ierr); 346674ae819SStefano Zampini ierr = MPI_Isend(&send_buffer[ptrs_buffer[i-1]],buf_size,MPIU_SCALAR,neigh,0,comm,&send_reqs[i-1]);CHKERRQ(ierr); 347674ae819SStefano Zampini ierr = MPI_Irecv(&recv_buffer[ptrs_buffer[i-1]],buf_size,MPIU_SCALAR,neigh,0,comm,&recv_reqs[i-1]);CHKERRQ(ierr); 348674ae819SStefano Zampini } 3492b095fd8SStefano Zampini ierr = VecRestoreArrayRead(pcis->vec1_N,(const PetscScalar**)&array);CHKERRQ(ierr); 3504b2aedd3SStefano Zampini if (pcis->n_neigh > 0) { 3514b2aedd3SStefano Zampini ierr = MPI_Waitall(pcis->n_neigh-1,recv_reqs,MPI_STATUSES_IGNORE);CHKERRQ(ierr); 3524b2aedd3SStefano Zampini } 353674ae819SStefano Zampini /* put values in correct places */ 354674ae819SStefano Zampini for (i=1;i<pcis->n_neigh;i++) { 355674ae819SStefano Zampini for (j=0;j<pcis->n_shared[i];j++) { 356674ae819SStefano Zampini k = pcis->shared[i][j]; 357674ae819SStefano Zampini neigh_position = 0; 358674ae819SStefano Zampini while(mat_graph->neighbours_set[k][neigh_position] != pcis->neigh[i]) {neigh_position++;} 359674ae819SStefano Zampini all_factors[k][neigh_position]=recv_buffer[ptrs_buffer[i-1]+j]; 360674ae819SStefano Zampini } 361674ae819SStefano Zampini } 3624b2aedd3SStefano Zampini if (pcis->n_neigh > 0) { 3634b2aedd3SStefano Zampini ierr = MPI_Waitall(pcis->n_neigh-1,send_reqs,MPI_STATUSES_IGNORE);CHKERRQ(ierr); 3644b2aedd3SStefano Zampini } 365674ae819SStefano Zampini ierr = PetscFree(send_reqs);CHKERRQ(ierr); 366674ae819SStefano Zampini ierr = PetscFree(recv_reqs);CHKERRQ(ierr); 367674ae819SStefano Zampini ierr = PetscFree(send_buffer);CHKERRQ(ierr); 368674ae819SStefano Zampini ierr = PetscFree(recv_buffer);CHKERRQ(ierr); 369674ae819SStefano Zampini ierr = PetscFree(ptrs_buffer);CHKERRQ(ierr); 370*25d06dbeSstefano_zampini } 371674ae819SStefano Zampini 372674ae819SStefano Zampini /* Compute B and B_delta (local actions) */ 373785e854fSJed Brown ierr = PetscMalloc1(pcis->n_neigh,&aux_sums);CHKERRQ(ierr); 374785e854fSJed Brown ierr = PetscMalloc1(n_local_lambda,&l2g_indices);CHKERRQ(ierr); 375785e854fSJed Brown ierr = PetscMalloc1(n_local_lambda,&vals_B_delta);CHKERRQ(ierr); 376785e854fSJed Brown ierr = PetscMalloc1(n_local_lambda,&cols_B_delta);CHKERRQ(ierr); 377*25d06dbeSstefano_zampini if (!pcbddc->use_deluxe_scaling) { 378785e854fSJed Brown ierr = PetscMalloc1(n_local_lambda,&scaling_factors);CHKERRQ(ierr); 379*25d06dbeSstefano_zampini } else { 380*25d06dbeSstefano_zampini scaling_factors = NULL; 381*25d06dbeSstefano_zampini all_factors = NULL; 382*25d06dbeSstefano_zampini } 383dc456d91SStefano Zampini ierr = ISGetIndices(subset_n,&aux_global_numbering);CHKERRQ(ierr); 384674ae819SStefano Zampini partial_sum=0; 385dc456d91SStefano Zampini cum = 0; 386674ae819SStefano Zampini for (i=0;i<dual_size;i++) { 387dc456d91SStefano Zampini n_global_lambda = aux_global_numbering[cum]; 388674ae819SStefano Zampini j = mat_graph->count[aux_local_numbering_1[i]]; 389674ae819SStefano Zampini aux_sums[0]=0; 390674ae819SStefano Zampini for (s=1;s<j;s++) { 391674ae819SStefano Zampini aux_sums[s]=aux_sums[s-1]+j-s+1; 392674ae819SStefano Zampini } 393*25d06dbeSstefano_zampini if (all_factors) array = all_factors[aux_local_numbering_1[i]]; 394674ae819SStefano Zampini n_neg_values = 0; 3952a7da448SStefano Zampini while(n_neg_values < j && mat_graph->neighbours_set[aux_local_numbering_1[i]][n_neg_values] < rank) {n_neg_values++;} 396674ae819SStefano Zampini n_pos_values = j - n_neg_values; 397674ae819SStefano Zampini if (fully_redundant) { 398674ae819SStefano Zampini for (s=0;s<n_neg_values;s++) { 399674ae819SStefano Zampini l2g_indices [partial_sum+s]=aux_sums[s]+n_neg_values-s-1+n_global_lambda; 400674ae819SStefano Zampini cols_B_delta [partial_sum+s]=dual_dofs_boundary_indices[i]; 401674ae819SStefano Zampini vals_B_delta [partial_sum+s]=-1.0; 402*25d06dbeSstefano_zampini if (!pcbddc->use_deluxe_scaling) scaling_factors[partial_sum+s]=array[s]; 403674ae819SStefano Zampini } 404674ae819SStefano Zampini for (s=0;s<n_pos_values;s++) { 405674ae819SStefano Zampini l2g_indices [partial_sum+s+n_neg_values]=aux_sums[n_neg_values]+s+n_global_lambda; 406674ae819SStefano Zampini cols_B_delta [partial_sum+s+n_neg_values]=dual_dofs_boundary_indices[i]; 407674ae819SStefano Zampini vals_B_delta [partial_sum+s+n_neg_values]=1.0; 408*25d06dbeSstefano_zampini if (!pcbddc->use_deluxe_scaling) scaling_factors[partial_sum+s+n_neg_values]=array[s+n_neg_values]; 409674ae819SStefano Zampini } 410674ae819SStefano Zampini partial_sum += j; 411674ae819SStefano Zampini } else { 412674ae819SStefano Zampini /* l2g_indices and default cols and vals of B_delta */ 413674ae819SStefano Zampini for (s=0;s<j;s++) { 414674ae819SStefano Zampini l2g_indices [partial_sum+s]=n_global_lambda+s; 415674ae819SStefano Zampini cols_B_delta [partial_sum+s]=dual_dofs_boundary_indices[i]; 416674ae819SStefano Zampini vals_B_delta [partial_sum+s]=0.0; 417674ae819SStefano Zampini } 418674ae819SStefano Zampini /* B_delta */ 419674ae819SStefano Zampini if ( n_neg_values > 0 ) { /* there's a rank next to me to the left */ 420674ae819SStefano Zampini vals_B_delta [partial_sum+n_neg_values-1]=-1.0; 421674ae819SStefano Zampini } 422674ae819SStefano Zampini if ( n_neg_values < j ) { /* there's a rank next to me to the right */ 423674ae819SStefano Zampini vals_B_delta [partial_sum+n_neg_values]=1.0; 424674ae819SStefano Zampini } 425674ae819SStefano Zampini /* scaling as in Klawonn-Widlund 1999 */ 426*25d06dbeSstefano_zampini if (!pcbddc->use_deluxe_scaling) { 427674ae819SStefano Zampini for (s=0;s<n_neg_values;s++) { 428674ae819SStefano Zampini scalar_value = 0.0; 429*25d06dbeSstefano_zampini for (k=0;k<s+1;k++) scalar_value += array[k]; 430674ae819SStefano Zampini scaling_factors[partial_sum+s] = -scalar_value; 431674ae819SStefano Zampini } 432674ae819SStefano Zampini for (s=0;s<n_pos_values;s++) { 433674ae819SStefano Zampini scalar_value = 0.0; 434*25d06dbeSstefano_zampini for (k=s+n_neg_values;k<j;k++) scalar_value += array[k]; 435674ae819SStefano Zampini scaling_factors[partial_sum+s+n_neg_values] = scalar_value; 436674ae819SStefano Zampini } 437*25d06dbeSstefano_zampini } 438674ae819SStefano Zampini partial_sum += j; 439674ae819SStefano Zampini } 440dc456d91SStefano Zampini cum += aux_local_numbering_2[i]; 441674ae819SStefano Zampini } 442dc456d91SStefano Zampini ierr = ISRestoreIndices(subset_n,&aux_global_numbering);CHKERRQ(ierr); 443dc456d91SStefano Zampini ierr = ISDestroy(&subset_mult);CHKERRQ(ierr); 444dc456d91SStefano Zampini ierr = ISDestroy(&subset_n);CHKERRQ(ierr); 445674ae819SStefano Zampini ierr = PetscFree(aux_sums);CHKERRQ(ierr); 446674ae819SStefano Zampini ierr = PetscFree(aux_local_numbering_1);CHKERRQ(ierr); 447674ae819SStefano Zampini ierr = PetscFree(dual_dofs_boundary_indices);CHKERRQ(ierr); 448*25d06dbeSstefano_zampini if (all_factors) { 449674ae819SStefano Zampini ierr = PetscFree(all_factors[0]);CHKERRQ(ierr); 450674ae819SStefano Zampini ierr = PetscFree(all_factors);CHKERRQ(ierr); 451*25d06dbeSstefano_zampini } 452674ae819SStefano Zampini 453674ae819SStefano Zampini /* Create local part of B_delta */ 454302440fdSBarry Smith ierr = MatCreate(PETSC_COMM_SELF,&fetidpmat_ctx->B_delta);CHKERRQ(ierr); 455674ae819SStefano Zampini ierr = MatSetSizes(fetidpmat_ctx->B_delta,n_local_lambda,pcis->n_B,n_local_lambda,pcis->n_B);CHKERRQ(ierr); 456674ae819SStefano Zampini ierr = MatSetType(fetidpmat_ctx->B_delta,MATSEQAIJ);CHKERRQ(ierr); 457674ae819SStefano Zampini ierr = MatSeqAIJSetPreallocation(fetidpmat_ctx->B_delta,1,NULL);CHKERRQ(ierr); 458674ae819SStefano Zampini ierr = MatSetOption(fetidpmat_ctx->B_delta,MAT_IGNORE_ZERO_ENTRIES,PETSC_TRUE);CHKERRQ(ierr); 459674ae819SStefano Zampini for (i=0;i<n_local_lambda;i++) { 460674ae819SStefano Zampini ierr = MatSetValue(fetidpmat_ctx->B_delta,i,cols_B_delta[i],vals_B_delta[i],INSERT_VALUES);CHKERRQ(ierr); 461674ae819SStefano Zampini } 462674ae819SStefano Zampini ierr = PetscFree(vals_B_delta);CHKERRQ(ierr); 463674ae819SStefano Zampini ierr = MatAssemblyBegin(fetidpmat_ctx->B_delta,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 464674ae819SStefano Zampini ierr = MatAssemblyEnd(fetidpmat_ctx->B_delta,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 465674ae819SStefano Zampini 466*25d06dbeSstefano_zampini BD1 = NULL; 467*25d06dbeSstefano_zampini BD2 = NULL; 468674ae819SStefano Zampini if (fully_redundant) { 469*25d06dbeSstefano_zampini if (pcbddc->use_deluxe_scaling) SETERRQ(comm,PETSC_ERR_SUP,"Deluxe FETIDP with fully-redundant multipliers to be implemented"); 470302440fdSBarry Smith ierr = MatCreate(PETSC_COMM_SELF,&ScalingMat);CHKERRQ(ierr); 471674ae819SStefano Zampini ierr = MatSetSizes(ScalingMat,n_local_lambda,n_local_lambda,n_local_lambda,n_local_lambda);CHKERRQ(ierr); 472674ae819SStefano Zampini ierr = MatSetType(ScalingMat,MATSEQAIJ);CHKERRQ(ierr); 473674ae819SStefano Zampini ierr = MatSeqAIJSetPreallocation(ScalingMat,1,NULL);CHKERRQ(ierr); 474674ae819SStefano Zampini for (i=0;i<n_local_lambda;i++) { 475674ae819SStefano Zampini ierr = MatSetValue(ScalingMat,i,i,scaling_factors[i],INSERT_VALUES);CHKERRQ(ierr); 476674ae819SStefano Zampini } 477674ae819SStefano Zampini ierr = MatAssemblyBegin(ScalingMat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 478674ae819SStefano Zampini ierr = MatAssemblyEnd(ScalingMat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 479674ae819SStefano Zampini ierr = MatMatMult(ScalingMat,fetidpmat_ctx->B_delta,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&fetidpmat_ctx->B_Ddelta);CHKERRQ(ierr); 480674ae819SStefano Zampini ierr = MatDestroy(&ScalingMat);CHKERRQ(ierr); 481674ae819SStefano Zampini } else { 482302440fdSBarry Smith ierr = MatCreate(PETSC_COMM_SELF,&fetidpmat_ctx->B_Ddelta);CHKERRQ(ierr); 483674ae819SStefano Zampini ierr = MatSetSizes(fetidpmat_ctx->B_Ddelta,n_local_lambda,pcis->n_B,n_local_lambda,pcis->n_B);CHKERRQ(ierr); 484*25d06dbeSstefano_zampini if (!pcbddc->use_deluxe_scaling) { 485674ae819SStefano Zampini ierr = MatSetType(fetidpmat_ctx->B_Ddelta,MATSEQAIJ);CHKERRQ(ierr); 486674ae819SStefano Zampini ierr = MatSeqAIJSetPreallocation(fetidpmat_ctx->B_Ddelta,1,NULL);CHKERRQ(ierr); 487674ae819SStefano Zampini for (i=0;i<n_local_lambda;i++) { 488674ae819SStefano Zampini ierr = MatSetValue(fetidpmat_ctx->B_Ddelta,i,cols_B_delta[i],scaling_factors[i],INSERT_VALUES);CHKERRQ(ierr); 489674ae819SStefano Zampini } 490674ae819SStefano Zampini ierr = MatAssemblyBegin(fetidpmat_ctx->B_Ddelta,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 491674ae819SStefano Zampini ierr = MatAssemblyEnd(fetidpmat_ctx->B_Ddelta,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 492*25d06dbeSstefano_zampini } else { 493*25d06dbeSstefano_zampini /* scaling as in Klawonn-Widlund 1999 */ 494*25d06dbeSstefano_zampini PCBDDCDeluxeScaling deluxe_ctx = pcbddc->deluxe_ctx; 495*25d06dbeSstefano_zampini PCBDDCSubSchurs sub_schurs = pcbddc->sub_schurs; 496*25d06dbeSstefano_zampini Mat T; 497*25d06dbeSstefano_zampini PetscScalar *W,lwork,*Bwork; 498*25d06dbeSstefano_zampini const PetscInt *idxs; 499*25d06dbeSstefano_zampini PetscInt cum,mss,*nnz; 500*25d06dbeSstefano_zampini PetscBLASInt *pivots,B_lwork,B_N,B_ierr; 501*25d06dbeSstefano_zampini 502*25d06dbeSstefano_zampini if (!pcbddc->deluxe_singlemat) SETERRQ(comm,PETSC_ERR_USER,"Cannot compute B_Ddelta! rerun with -pc_bddc_deluxe_singlemat"); 503*25d06dbeSstefano_zampini if (deluxe_ctx->change) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"Cannot compute B_Ddelta with deluxe scaling with active change context"); 504*25d06dbeSstefano_zampini 505*25d06dbeSstefano_zampini mss = 0; 506*25d06dbeSstefano_zampini ierr = PetscCalloc1(pcis->n_B,&nnz);CHKERRQ(ierr); 507*25d06dbeSstefano_zampini if (sub_schurs->is_Ej_all) { 508*25d06dbeSstefano_zampini ierr = ISGetIndices(sub_schurs->is_Ej_all,&idxs);CHKERRQ(ierr); 509*25d06dbeSstefano_zampini for (i=0,cum=0;i<sub_schurs->n_subs;i++) { 510*25d06dbeSstefano_zampini PetscInt subset_size; 511*25d06dbeSstefano_zampini 512*25d06dbeSstefano_zampini ierr = ISGetLocalSize(sub_schurs->is_subs[i],&subset_size);CHKERRQ(ierr); 513*25d06dbeSstefano_zampini for (j=0;j<subset_size;j++) nnz[idxs[j+cum]] = subset_size; 514*25d06dbeSstefano_zampini mss = PetscMax(mss,subset_size); 515*25d06dbeSstefano_zampini cum += subset_size; 516*25d06dbeSstefano_zampini } 517*25d06dbeSstefano_zampini } 518*25d06dbeSstefano_zampini ierr = MatCreate(PETSC_COMM_SELF,&T);CHKERRQ(ierr); 519*25d06dbeSstefano_zampini ierr = MatSetSizes(T,pcis->n_B,pcis->n_B,pcis->n_B,pcis->n_B);CHKERRQ(ierr); 520*25d06dbeSstefano_zampini ierr = MatSetType(T,MATSEQAIJ);CHKERRQ(ierr); 521*25d06dbeSstefano_zampini ierr = MatSeqAIJSetPreallocation(T,0,nnz);CHKERRQ(ierr); 522*25d06dbeSstefano_zampini ierr = PetscFree(nnz);CHKERRQ(ierr); 523*25d06dbeSstefano_zampini 524*25d06dbeSstefano_zampini /* workspace allocation */ 525*25d06dbeSstefano_zampini B_lwork = -1; 526*25d06dbeSstefano_zampini ierr = PetscBLASIntCast(mss,&B_N);CHKERRQ(ierr); 527*25d06dbeSstefano_zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 528*25d06dbeSstefano_zampini PetscStackCallBLAS("LAPACKgetri",LAPACKgetri_(&B_N,W,&B_N,&B_N,&lwork,&B_lwork,&B_ierr)); 529*25d06dbeSstefano_zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 530*25d06dbeSstefano_zampini if (B_ierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in query to GETRI Lapack routine %d",(int)B_ierr); 531*25d06dbeSstefano_zampini ierr = PetscBLASIntCast((PetscInt)PetscRealPart(lwork),&B_lwork);CHKERRQ(ierr); 532*25d06dbeSstefano_zampini ierr = PetscMalloc3(mss*mss,&W,mss,&pivots,B_lwork,&Bwork);CHKERRQ(ierr); 533*25d06dbeSstefano_zampini 534*25d06dbeSstefano_zampini for (i=0,cum=0;i<sub_schurs->n_subs;i++) { 535*25d06dbeSstefano_zampini PetscScalar *M; 536*25d06dbeSstefano_zampini PetscInt subset_size; 537*25d06dbeSstefano_zampini 538*25d06dbeSstefano_zampini ierr = ISGetLocalSize(sub_schurs->is_subs[i],&subset_size);CHKERRQ(ierr); 539*25d06dbeSstefano_zampini ierr = PetscBLASIntCast(subset_size,&B_N);CHKERRQ(ierr); 540*25d06dbeSstefano_zampini ierr = MatDenseGetArray(deluxe_ctx->seq_mat[i],&M);CHKERRQ(ierr); 541*25d06dbeSstefano_zampini ierr = PetscMemcpy(W,M,subset_size*subset_size*sizeof(PetscScalar));CHKERRQ(ierr); 542*25d06dbeSstefano_zampini ierr = MatDenseRestoreArray(deluxe_ctx->seq_mat[i],&M);CHKERRQ(ierr); 543*25d06dbeSstefano_zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 544*25d06dbeSstefano_zampini PetscStackCallBLAS("LAPACKgetrf",LAPACKgetrf_(&B_N,&B_N,W,&B_N,pivots,&B_ierr)); 545*25d06dbeSstefano_zampini if (B_ierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in GETRF Lapack routine %d",(int)B_ierr); 546*25d06dbeSstefano_zampini PetscStackCallBLAS("LAPACKgetri",LAPACKgetri_(&B_N,W,&B_N,pivots,Bwork,&B_lwork,&B_ierr)); 547*25d06dbeSstefano_zampini if (B_ierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in GETRI Lapack routine %d",(int)B_ierr); 548*25d06dbeSstefano_zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 549*25d06dbeSstefano_zampini ierr = MatSetValues(T,subset_size,idxs+cum,subset_size,idxs+cum,W,INSERT_VALUES);CHKERRQ(ierr); 550*25d06dbeSstefano_zampini cum += subset_size; 551*25d06dbeSstefano_zampini } 552*25d06dbeSstefano_zampini ierr = MatAssemblyBegin(T,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 553*25d06dbeSstefano_zampini ierr = MatAssemblyEnd(T,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 554*25d06dbeSstefano_zampini ierr = MatMatTransposeMult(T,fetidpmat_ctx->B_delta,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&BD1);CHKERRQ(ierr); 555*25d06dbeSstefano_zampini ierr = MatMatMult(fetidpmat_ctx->B_delta,BD1,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&BD2);CHKERRQ(ierr); 556*25d06dbeSstefano_zampini ierr = MatDestroy(&T);CHKERRQ(ierr); 557*25d06dbeSstefano_zampini ierr = PetscFree3(W,pivots,Bwork);CHKERRQ(ierr); 558*25d06dbeSstefano_zampini if (sub_schurs->is_Ej_all) { 559*25d06dbeSstefano_zampini ierr = ISRestoreIndices(sub_schurs->is_Ej_all,&idxs);CHKERRQ(ierr); 560*25d06dbeSstefano_zampini } 561*25d06dbeSstefano_zampini } 562674ae819SStefano Zampini } 563674ae819SStefano Zampini ierr = PetscFree(scaling_factors);CHKERRQ(ierr); 564674ae819SStefano Zampini ierr = PetscFree(cols_B_delta);CHKERRQ(ierr); 565674ae819SStefano Zampini 566457d4a33Sstefano_zampini /* Layout of multipliers */ 567457d4a33Sstefano_zampini ierr = PetscLayoutCreate(comm,&llay);CHKERRQ(ierr); 568457d4a33Sstefano_zampini ierr = PetscLayoutSetBlockSize(llay,1);CHKERRQ(ierr); 569457d4a33Sstefano_zampini ierr = PetscLayoutSetSize(llay,fetidpmat_ctx->n_lambda);CHKERRQ(ierr); 570457d4a33Sstefano_zampini ierr = PetscLayoutSetUp(llay);CHKERRQ(ierr); 571457d4a33Sstefano_zampini ierr = PetscLayoutGetLocalSize(llay,&fetidpmat_ctx->n);CHKERRQ(ierr); 572457d4a33Sstefano_zampini 573457d4a33Sstefano_zampini /* Local work vector of multipliers */ 574457d4a33Sstefano_zampini ierr = VecCreate(PETSC_COMM_SELF,&fetidpmat_ctx->lambda_local);CHKERRQ(ierr); 575457d4a33Sstefano_zampini ierr = VecSetSizes(fetidpmat_ctx->lambda_local,n_local_lambda,n_local_lambda);CHKERRQ(ierr); 576457d4a33Sstefano_zampini ierr = VecSetType(fetidpmat_ctx->lambda_local,VECSEQ);CHKERRQ(ierr); 577457d4a33Sstefano_zampini 578*25d06dbeSstefano_zampini if (BD2) { 579*25d06dbeSstefano_zampini ISLocalToGlobalMapping l2g; 580*25d06dbeSstefano_zampini Mat T,TA,*pT; 581*25d06dbeSstefano_zampini IS is; 582*25d06dbeSstefano_zampini PetscInt nl,N; 583*25d06dbeSstefano_zampini BDdelta_DN ctx; 584*25d06dbeSstefano_zampini 585*25d06dbeSstefano_zampini ierr = PetscLayoutGetLocalSize(llay,&nl);CHKERRQ(ierr); 586*25d06dbeSstefano_zampini ierr = PetscLayoutGetSize(llay,&N);CHKERRQ(ierr); 587*25d06dbeSstefano_zampini ierr = MatCreate(comm,&T);CHKERRQ(ierr); 588*25d06dbeSstefano_zampini ierr = MatSetSizes(T,nl,nl,N,N);CHKERRQ(ierr); 589*25d06dbeSstefano_zampini ierr = MatSetType(T,MATIS);CHKERRQ(ierr); 590*25d06dbeSstefano_zampini ierr = ISLocalToGlobalMappingCreate(comm,1,n_local_lambda,l2g_indices,PETSC_COPY_VALUES,&l2g);CHKERRQ(ierr); 591*25d06dbeSstefano_zampini ierr = MatSetLocalToGlobalMapping(T,l2g,l2g);CHKERRQ(ierr); 592*25d06dbeSstefano_zampini ierr = ISLocalToGlobalMappingDestroy(&l2g);CHKERRQ(ierr); 593*25d06dbeSstefano_zampini ierr = MatISSetLocalMat(T,BD2);CHKERRQ(ierr); 594*25d06dbeSstefano_zampini ierr = MatDestroy(&BD2);CHKERRQ(ierr); 595*25d06dbeSstefano_zampini ierr = MatISGetMPIXAIJ(T,MAT_INITIAL_MATRIX,&TA);CHKERRQ(ierr); 596*25d06dbeSstefano_zampini ierr = MatDestroy(&T);CHKERRQ(ierr); 597*25d06dbeSstefano_zampini ierr = ISCreateGeneral(comm,n_local_lambda,l2g_indices,PETSC_USE_POINTER,&is);CHKERRQ(ierr); 598*25d06dbeSstefano_zampini ierr = MatGetSubMatrices(TA,1,&is,&is,MAT_INITIAL_MATRIX,&pT);CHKERRQ(ierr); 599*25d06dbeSstefano_zampini ierr = MatDestroy(&TA);CHKERRQ(ierr); 600*25d06dbeSstefano_zampini ierr = ISDestroy(&is);CHKERRQ(ierr); 601*25d06dbeSstefano_zampini BD2 = pT[0]; 602*25d06dbeSstefano_zampini ierr = PetscFree(pT);CHKERRQ(ierr); 603*25d06dbeSstefano_zampini 604*25d06dbeSstefano_zampini /* B_Ddelta for non-redundant multipliers with deluxe scaling */ 605*25d06dbeSstefano_zampini ierr = PetscNew(&ctx);CHKERRQ(ierr); 606*25d06dbeSstefano_zampini ierr = MatSetType(fetidpmat_ctx->B_Ddelta,MATSHELL);CHKERRQ(ierr); 607*25d06dbeSstefano_zampini ierr = MatShellSetContext(fetidpmat_ctx->B_Ddelta,(void *)ctx);CHKERRQ(ierr); 608*25d06dbeSstefano_zampini ierr = MatShellSetOperation(fetidpmat_ctx->B_Ddelta,MATOP_MULT,(void (*)(void))MatMult_BDdelta_deluxe_nonred);CHKERRQ(ierr); 609*25d06dbeSstefano_zampini ierr = MatShellSetOperation(fetidpmat_ctx->B_Ddelta,MATOP_MULT_TRANSPOSE,(void (*)(void))MatMultTranspose_BDdelta_deluxe_nonred);CHKERRQ(ierr); 610*25d06dbeSstefano_zampini ierr = MatShellSetOperation(fetidpmat_ctx->B_Ddelta,MATOP_DESTROY,(void (*)(void))MatDestroy_BDdelta_deluxe_nonred);CHKERRQ(ierr); 611*25d06dbeSstefano_zampini ierr = MatSetUp(fetidpmat_ctx->B_Ddelta);CHKERRQ(ierr); 612*25d06dbeSstefano_zampini 613*25d06dbeSstefano_zampini ierr = PetscObjectReference((PetscObject)BD1);CHKERRQ(ierr); 614*25d06dbeSstefano_zampini ctx->BD = BD1; 615*25d06dbeSstefano_zampini ierr = KSPCreate(PETSC_COMM_SELF,&ctx->kBD);CHKERRQ(ierr); 616*25d06dbeSstefano_zampini ierr = KSPSetOperators(ctx->kBD,BD2,BD2);CHKERRQ(ierr); 617*25d06dbeSstefano_zampini ierr = VecDuplicate(fetidpmat_ctx->lambda_local,&ctx->work);CHKERRQ(ierr); 618*25d06dbeSstefano_zampini fetidpmat_ctx->deluxe_nonred = PETSC_TRUE; 619*25d06dbeSstefano_zampini } 620*25d06dbeSstefano_zampini ierr = MatDestroy(&BD1);CHKERRQ(ierr); 621*25d06dbeSstefano_zampini ierr = MatDestroy(&BD2);CHKERRQ(ierr); 622*25d06dbeSstefano_zampini 623*25d06dbeSstefano_zampini /* fetidpmat sizes */ 624*25d06dbeSstefano_zampini fetidpmat_ctx->n += nPgl; 625*25d06dbeSstefano_zampini fetidpmat_ctx->N = fetidpmat_ctx->n_lambda+nPg; 626*25d06dbeSstefano_zampini 627457d4a33Sstefano_zampini /* Global vector for FETI-DP linear system */ 628457d4a33Sstefano_zampini ierr = VecCreate(comm,&fetidp_global);CHKERRQ(ierr); 629457d4a33Sstefano_zampini ierr = VecSetSizes(fetidp_global,fetidpmat_ctx->n,fetidpmat_ctx->N);CHKERRQ(ierr); 630457d4a33Sstefano_zampini ierr = VecSetType(fetidp_global,VECMPI);CHKERRQ(ierr); 631457d4a33Sstefano_zampini ierr = VecSetUp(fetidp_global);CHKERRQ(ierr); 632457d4a33Sstefano_zampini 6339eec4de8Sstefano_zampini /* Decide layout for fetidp dofs: if it is a saddle point problem 6349eec4de8Sstefano_zampini pressure is ordered first in the local part of the global vector 635457d4a33Sstefano_zampini of the FETI-DP linear system */ 636457d4a33Sstefano_zampini if (nPg) { 637af140850Sstefano_zampini IS IS_l2g_p,ais; 638457d4a33Sstefano_zampini PetscLayout alay; 639457d4a33Sstefano_zampini const PetscInt *idxs,*pranges,*aranges,*lranges; 640af140850Sstefano_zampini PetscInt *l2g_indices_p,rst; 641457d4a33Sstefano_zampini 642457d4a33Sstefano_zampini ierr = PetscMalloc1(nPl,&l2g_indices_p);CHKERRQ(ierr); 643457d4a33Sstefano_zampini ierr = VecGetLayout(fetidp_global,&alay);CHKERRQ(ierr); 644457d4a33Sstefano_zampini ierr = PetscLayoutGetRanges(alay,&aranges);CHKERRQ(ierr); 645457d4a33Sstefano_zampini ierr = PetscLayoutGetRanges(play,&pranges);CHKERRQ(ierr); 646457d4a33Sstefano_zampini ierr = PetscLayoutGetRanges(llay,&lranges);CHKERRQ(ierr); 647457d4a33Sstefano_zampini ierr = ISLocalToGlobalMappingGetIndices(l2gmap_p,&idxs);CHKERRQ(ierr); 648af140850Sstefano_zampini /* shift local to global indices for pressure */ 649457d4a33Sstefano_zampini for (i=0;i<nPl;i++) { 650457d4a33Sstefano_zampini PetscInt owner; 651457d4a33Sstefano_zampini 652457d4a33Sstefano_zampini ierr = PetscLayoutFindOwner(play,idxs[i],&owner);CHKERRQ(ierr); 653457d4a33Sstefano_zampini l2g_indices_p[i] = idxs[i]-pranges[owner]+aranges[owner]; 654457d4a33Sstefano_zampini } 655457d4a33Sstefano_zampini ierr = ISLocalToGlobalMappingRestoreIndices(l2gmap_p,&idxs);CHKERRQ(ierr); 656457d4a33Sstefano_zampini ierr = ISCreateGeneral(comm,nPl,l2g_indices_p,PETSC_OWN_POINTER,&IS_l2g_p);CHKERRQ(ierr); 657af140850Sstefano_zampini 658457d4a33Sstefano_zampini /* local to global scatter for interface pressure */ 659457d4a33Sstefano_zampini ierr = VecScatterCreate(fetidpmat_ctx->vP,NULL,fetidp_global,IS_l2g_p,&fetidpmat_ctx->l2g_p);CHKERRQ(ierr); 660457d4a33Sstefano_zampini ierr = ISDestroy(&IS_l2g_p);CHKERRQ(ierr); 661457d4a33Sstefano_zampini 662af140850Sstefano_zampini /* shift local to global indices for multipliers */ 663457d4a33Sstefano_zampini for (i=0;i<n_local_lambda;i++) { 664457d4a33Sstefano_zampini PetscInt owner,ps; 665457d4a33Sstefano_zampini 666457d4a33Sstefano_zampini ierr = PetscLayoutFindOwner(llay,l2g_indices[i],&owner);CHKERRQ(ierr); 667457d4a33Sstefano_zampini ps = pranges[owner+1]-pranges[owner]; 668457d4a33Sstefano_zampini l2g_indices[i] = l2g_indices[i]-lranges[owner]+aranges[owner]+ps; 669457d4a33Sstefano_zampini } 670457d4a33Sstefano_zampini 6719cc7774eSstefano_zampini /* scatter from alldofs to interface pressures global fetidp vector */ 6729cc7774eSstefano_zampini ierr = PetscLayoutGetRange(alay,&rst,NULL);CHKERRQ(ierr); 6739cc7774eSstefano_zampini ierr = ISCreateStride(comm,nPgl,rst,1,&ais);CHKERRQ(ierr); 674af140850Sstefano_zampini ierr = VecScatterCreate(pcis->vec1_global,pP,fetidp_global,ais,&fetidpmat_ctx->g2g_p);CHKERRQ(ierr); 6759cc7774eSstefano_zampini ierr = ISDestroy(&ais);CHKERRQ(ierr); 676457d4a33Sstefano_zampini } 677457d4a33Sstefano_zampini ierr = PetscLayoutDestroy(&llay);CHKERRQ(ierr); 678457d4a33Sstefano_zampini ierr = PetscLayoutDestroy(&play);CHKERRQ(ierr); 679457d4a33Sstefano_zampini ierr = ISCreateGeneral(comm,n_local_lambda,l2g_indices,PETSC_OWN_POINTER,&IS_l2g_lambda);CHKERRQ(ierr); 680a1c0d0daSstefano_zampini 6819cc7774eSstefano_zampini /* scatter from local to global multipliers */ 682457d4a33Sstefano_zampini ierr = VecScatterCreate(fetidpmat_ctx->lambda_local,NULL,fetidp_global,IS_l2g_lambda,&fetidpmat_ctx->l2g_lambda);CHKERRQ(ierr); 683457d4a33Sstefano_zampini ierr = ISDestroy(&IS_l2g_lambda);CHKERRQ(ierr); 684457d4a33Sstefano_zampini ierr = ISLocalToGlobalMappingDestroy(&l2gmap_p);CHKERRQ(ierr); 685a1c0d0daSstefano_zampini ierr = VecDestroy(&fetidp_global);CHKERRQ(ierr); 686457d4a33Sstefano_zampini 687a1c0d0daSstefano_zampini /* Create some work vectors needed by fetidp */ 688674ae819SStefano Zampini ierr = VecDuplicate(pcis->vec1_B,&fetidpmat_ctx->temp_solution_B);CHKERRQ(ierr); 689674ae819SStefano Zampini ierr = VecDuplicate(pcis->vec1_D,&fetidpmat_ctx->temp_solution_D);CHKERRQ(ierr); 690674ae819SStefano Zampini PetscFunctionReturn(0); 691674ae819SStefano Zampini } 692674ae819SStefano Zampini 693*25d06dbeSstefano_zampini 694674ae819SStefano Zampini #undef __FUNCT__ 695674ae819SStefano Zampini #define __FUNCT__ "PCBDDCSetupFETIDPPCContext" 696674ae819SStefano Zampini PetscErrorCode PCBDDCSetupFETIDPPCContext(Mat fetimat, FETIDPPC_ctx fetidppc_ctx) 697674ae819SStefano Zampini { 698674ae819SStefano Zampini FETIDPMat_ctx mat_ctx; 699*25d06dbeSstefano_zampini PC_BDDC *pcbddc = (PC_BDDC*)fetidppc_ctx->pc->data; 700*25d06dbeSstefano_zampini PC_IS *pcis = (PC_IS*)fetidppc_ctx->pc->data; 701f28b6018SStefano Zampini PetscBool lumped = PETSC_FALSE; 702674ae819SStefano Zampini PetscErrorCode ierr; 703674ae819SStefano Zampini 704674ae819SStefano Zampini PetscFunctionBegin; 705674ae819SStefano Zampini ierr = MatShellGetContext(fetimat,(void**)&mat_ctx);CHKERRQ(ierr); 706674ae819SStefano Zampini /* get references from objects created when setting up feti mat context */ 707674ae819SStefano Zampini ierr = PetscObjectReference((PetscObject)mat_ctx->lambda_local);CHKERRQ(ierr); 708674ae819SStefano Zampini fetidppc_ctx->lambda_local = mat_ctx->lambda_local; 709674ae819SStefano Zampini ierr = PetscObjectReference((PetscObject)mat_ctx->B_Ddelta);CHKERRQ(ierr); 710674ae819SStefano Zampini fetidppc_ctx->B_Ddelta = mat_ctx->B_Ddelta; 711*25d06dbeSstefano_zampini if (mat_ctx->deluxe_nonred) { 712*25d06dbeSstefano_zampini PC pc,mpc; 713*25d06dbeSstefano_zampini BDdelta_DN ctx; 714*25d06dbeSstefano_zampini MatSolverPackage solver; 715*25d06dbeSstefano_zampini const char *prefix; 716*25d06dbeSstefano_zampini 717*25d06dbeSstefano_zampini ierr = MatShellGetContext(mat_ctx->B_Ddelta,&ctx);CHKERRQ(ierr); 718*25d06dbeSstefano_zampini ierr = KSPSetType(ctx->kBD,KSPPREONLY);CHKERRQ(ierr); 719*25d06dbeSstefano_zampini ierr = KSPGetPC(ctx->kBD,&mpc);CHKERRQ(ierr); 720*25d06dbeSstefano_zampini ierr = KSPGetPC(pcbddc->ksp_D,&pc);CHKERRQ(ierr); 721*25d06dbeSstefano_zampini ierr = PCSetType(mpc,PCLU);CHKERRQ(ierr); 722*25d06dbeSstefano_zampini ierr = PCFactorGetMatSolverPackage(pc,(const MatSolverPackage*)&solver);CHKERRQ(ierr); 723*25d06dbeSstefano_zampini if (solver) { 724*25d06dbeSstefano_zampini ierr = PCFactorSetMatSolverPackage(mpc,solver);CHKERRQ(ierr); 725*25d06dbeSstefano_zampini } 726*25d06dbeSstefano_zampini ierr = MatGetOptionsPrefix(fetimat,&prefix);CHKERRQ(ierr); 727*25d06dbeSstefano_zampini ierr = KSPSetOptionsPrefix(ctx->kBD,prefix);CHKERRQ(ierr); 728*25d06dbeSstefano_zampini ierr = KSPAppendOptionsPrefix(ctx->kBD,"bddelta_");CHKERRQ(ierr); 729*25d06dbeSstefano_zampini ierr = KSPSetFromOptions(ctx->kBD);CHKERRQ(ierr); 730*25d06dbeSstefano_zampini } 731*25d06dbeSstefano_zampini 732674ae819SStefano Zampini ierr = PetscObjectReference((PetscObject)mat_ctx->l2g_lambda);CHKERRQ(ierr); 733674ae819SStefano Zampini fetidppc_ctx->l2g_lambda = mat_ctx->l2g_lambda; 734f28b6018SStefano Zampini /* Dirichlet preconditioner */ 7359c2d02cdSstefano_zampini ierr = PetscOptionsGetBool(NULL,((PetscObject)fetimat)->prefix,"-pc_lumped",&lumped,NULL);CHKERRQ(ierr); 736f28b6018SStefano Zampini if (!lumped) { 7379c2d02cdSstefano_zampini IS iP; 7389c2d02cdSstefano_zampini PetscBool discrete_harmonic = PETSC_FALSE; 7399c2d02cdSstefano_zampini 7409c2d02cdSstefano_zampini ierr = PetscObjectQuery((PetscObject)fetidppc_ctx->pc,"__KSPFETIDP_iP",(PetscObject*)&iP);CHKERRQ(ierr); 7419c2d02cdSstefano_zampini if (iP) { 7429c2d02cdSstefano_zampini ierr = PetscOptionsGetBool(NULL,((PetscObject)fetimat)->prefix,"-pc_discrete_harmonic",&discrete_harmonic,NULL);CHKERRQ(ierr); 7439c2d02cdSstefano_zampini } 7449c2d02cdSstefano_zampini if (discrete_harmonic) { 7459c2d02cdSstefano_zampini KSP sksp; 7469c2d02cdSstefano_zampini PC pc; 7479c2d02cdSstefano_zampini Mat A_II,A_IB,A_BI; 7489c2d02cdSstefano_zampini IS aB; 7499c2d02cdSstefano_zampini PetscInt nb; 7505334bea6Sstefano_zampini PetscBool isshell; 7519c2d02cdSstefano_zampini KSPType ksptype; 7529c2d02cdSstefano_zampini const char *prefix; 7539c2d02cdSstefano_zampini 7549c2d02cdSstefano_zampini /* 7559c2d02cdSstefano_zampini We constructs a Schur complement for 7569c2d02cdSstefano_zampini 7579c2d02cdSstefano_zampini | A_II A_ID | 7589c2d02cdSstefano_zampini | A_DI A_DD | 7599c2d02cdSstefano_zampini 7609c2d02cdSstefano_zampini instead of 7619c2d02cdSstefano_zampini 7629c2d02cdSstefano_zampini | A_II B^t_II A_ID | 7639c2d02cdSstefano_zampini | B_II -C_II B_ID | 7649c2d02cdSstefano_zampini | A_DI B^t_ID A_DD | 7659c2d02cdSstefano_zampini 7669c2d02cdSstefano_zampini */ 7679c2d02cdSstefano_zampini ierr = ISGetLocalSize(pcis->is_B_local,&nb);CHKERRQ(ierr); 7689c2d02cdSstefano_zampini ierr = ISCreateStride(PetscObjectComm((PetscObject)pcis->A_II),nb,0,1,&aB);CHKERRQ(ierr); 7699c2d02cdSstefano_zampini ierr = MatGetSubMatrix(pcis->A_II,iP,iP,MAT_INITIAL_MATRIX,&A_II);CHKERRQ(ierr); 7709c2d02cdSstefano_zampini ierr = MatGetSubMatrix(pcis->A_IB,iP,aB,MAT_INITIAL_MATRIX,&A_IB);CHKERRQ(ierr); 7719c2d02cdSstefano_zampini ierr = MatGetSubMatrix(pcis->A_BI,aB,iP,MAT_INITIAL_MATRIX,&A_BI);CHKERRQ(ierr); 7729c2d02cdSstefano_zampini ierr = MatCreateSchurComplement(A_II,A_II,A_IB,A_BI,pcis->A_BB,&fetidppc_ctx->S_j);CHKERRQ(ierr); 7739c2d02cdSstefano_zampini 7749c2d02cdSstefano_zampini /* propagate settings of solver */ 7759c2d02cdSstefano_zampini ierr = MatSchurComplementGetKSP(fetidppc_ctx->S_j,&sksp);CHKERRQ(ierr); 7769c2d02cdSstefano_zampini ierr = KSPGetType(pcis->ksp_D,&ksptype);CHKERRQ(ierr); 7779c2d02cdSstefano_zampini ierr = KSPSetType(sksp,ksptype);CHKERRQ(ierr); 7789c2d02cdSstefano_zampini ierr = KSPGetPC(pcis->ksp_D,&pc);CHKERRQ(ierr); 7795334bea6Sstefano_zampini ierr = PetscObjectTypeCompare((PetscObject)pc,PCSHELL,&isshell);CHKERRQ(ierr); 7805334bea6Sstefano_zampini if (!isshell) { 7815334bea6Sstefano_zampini MatSolverPackage solver; 7825334bea6Sstefano_zampini PCType pctype; 7835334bea6Sstefano_zampini 7849c2d02cdSstefano_zampini ierr = PCGetType(pc,&pctype);CHKERRQ(ierr); 7859c2d02cdSstefano_zampini ierr = PCFactorGetMatSolverPackage(pc,(const MatSolverPackage*)&solver);CHKERRQ(ierr); 7869c2d02cdSstefano_zampini ierr = KSPGetPC(sksp,&pc);CHKERRQ(ierr); 7879c2d02cdSstefano_zampini ierr = PCSetType(pc,pctype);CHKERRQ(ierr); 7889c2d02cdSstefano_zampini if (solver) { 7899c2d02cdSstefano_zampini ierr = PCFactorSetMatSolverPackage(pc,solver);CHKERRQ(ierr); 7909c2d02cdSstefano_zampini } 7915334bea6Sstefano_zampini } else { 7925334bea6Sstefano_zampini ierr = KSPGetPC(sksp,&pc);CHKERRQ(ierr); 7935334bea6Sstefano_zampini ierr = PCSetType(pc,PCLU);CHKERRQ(ierr); 7945334bea6Sstefano_zampini } 7959c2d02cdSstefano_zampini ierr = MatDestroy(&A_II);CHKERRQ(ierr); 7969c2d02cdSstefano_zampini ierr = MatDestroy(&A_IB);CHKERRQ(ierr); 7979c2d02cdSstefano_zampini ierr = MatDestroy(&A_BI);CHKERRQ(ierr); 7989c2d02cdSstefano_zampini ierr = ISDestroy(&aB);CHKERRQ(ierr); 7999c2d02cdSstefano_zampini ierr = MatGetOptionsPrefix(fetimat,&prefix);CHKERRQ(ierr); 8009c2d02cdSstefano_zampini ierr = KSPSetOptionsPrefix(sksp,prefix);CHKERRQ(ierr); 8019c2d02cdSstefano_zampini ierr = KSPAppendOptionsPrefix(sksp,"harmonic_");CHKERRQ(ierr); 8023016320fSstefano_zampini ierr = KSPSetFromOptions(sksp);CHKERRQ(ierr); 8039c2d02cdSstefano_zampini } else { /* default Dirichlet preconditioner is pde-harmonic */ 804ed6c3d69SStefano Zampini ierr = MatCreateSchurComplement(pcis->A_II,pcis->A_II,pcis->A_IB,pcis->A_BI,pcis->A_BB,&fetidppc_ctx->S_j);CHKERRQ(ierr); 805ed6c3d69SStefano Zampini ierr = MatSchurComplementSetKSP(fetidppc_ctx->S_j,pcis->ksp_D);CHKERRQ(ierr); 8069c2d02cdSstefano_zampini } 807f28b6018SStefano Zampini } else { 808f28b6018SStefano Zampini ierr = PetscObjectReference((PetscObject)pcis->A_BB);CHKERRQ(ierr); 809f28b6018SStefano Zampini fetidppc_ctx->S_j = pcis->A_BB; 810f28b6018SStefano Zampini } 811af140850Sstefano_zampini /* saddle-point */ 812af140850Sstefano_zampini if (mat_ctx->xPg) { 813af140850Sstefano_zampini ierr = PetscObjectReference((PetscObject)mat_ctx->xPg);CHKERRQ(ierr); 814af140850Sstefano_zampini fetidppc_ctx->xPg = mat_ctx->xPg; 815af140850Sstefano_zampini ierr = PetscObjectReference((PetscObject)mat_ctx->yPg);CHKERRQ(ierr); 816af140850Sstefano_zampini fetidppc_ctx->yPg = mat_ctx->yPg; 8176cc1294bSstefano_zampini ierr = PetscObjectQuery((PetscObject)fetidppc_ctx->pc,"__KSPFETIDP_PKSP",(PetscObject*)&fetidppc_ctx->kP);CHKERRQ(ierr); 8186cc1294bSstefano_zampini ierr = PetscObjectReference((PetscObject)fetidppc_ctx->kP);CHKERRQ(ierr); 819af140850Sstefano_zampini } 820674ae819SStefano Zampini PetscFunctionReturn(0); 821674ae819SStefano Zampini } 822674ae819SStefano Zampini 823674ae819SStefano Zampini #undef __FUNCT__ 824674ae819SStefano Zampini #define __FUNCT__ "FETIDPMatMult" 825674ae819SStefano Zampini PetscErrorCode FETIDPMatMult(Mat fetimat, Vec x, Vec y) 826674ae819SStefano Zampini { 827674ae819SStefano Zampini FETIDPMat_ctx mat_ctx; 828617d11aeSStefano Zampini PC_BDDC *pcbddc; 829674ae819SStefano Zampini PC_IS *pcis; 830674ae819SStefano Zampini PetscErrorCode ierr; 831674ae819SStefano Zampini 832674ae819SStefano Zampini PetscFunctionBegin; 833674ae819SStefano Zampini ierr = MatShellGetContext(fetimat,(void**)&mat_ctx);CHKERRQ(ierr); 834674ae819SStefano Zampini pcis = (PC_IS*)mat_ctx->pc->data; 835617d11aeSStefano Zampini pcbddc = (PC_BDDC*)mat_ctx->pc->data; 836674ae819SStefano Zampini /* Application of B_delta^T */ 837af140850Sstefano_zampini ierr = VecSet(pcis->vec1_B,0.);CHKERRQ(ierr); 838674ae819SStefano Zampini ierr = VecScatterBegin(mat_ctx->l2g_lambda,x,mat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 839674ae819SStefano Zampini ierr = VecScatterEnd(mat_ctx->l2g_lambda,x,mat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 840674ae819SStefano Zampini ierr = MatMultTranspose(mat_ctx->B_delta,mat_ctx->lambda_local,pcis->vec1_B);CHKERRQ(ierr); 841af140850Sstefano_zampini 842af140850Sstefano_zampini /* Add contribution from saddle point */ 843af140850Sstefano_zampini if (mat_ctx->l2g_p) { 844af140850Sstefano_zampini ierr = VecScatterBegin(mat_ctx->l2g_p,x,mat_ctx->vP,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 845af140850Sstefano_zampini ierr = VecScatterEnd(mat_ctx->l2g_p,x,mat_ctx->vP,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 846af140850Sstefano_zampini if (pcbddc->switch_static) { 847af140850Sstefano_zampini ierr = MatMult(mat_ctx->Bt_BI,mat_ctx->vP,pcis->vec1_D);CHKERRQ(ierr); 848af140850Sstefano_zampini } 849af140850Sstefano_zampini ierr = MatMultAdd(mat_ctx->Bt_BB,mat_ctx->vP,pcis->vec1_B,pcis->vec1_B);CHKERRQ(ierr); 850af140850Sstefano_zampini } else { 851af140850Sstefano_zampini if (pcbddc->switch_static) { 852674ae819SStefano Zampini ierr = VecSet(pcis->vec1_D,0.0);CHKERRQ(ierr); 853af140850Sstefano_zampini } 854af140850Sstefano_zampini } 855af140850Sstefano_zampini /* Application of \widetilde{S}^-1 */ 856617d11aeSStefano Zampini ierr = PetscMemzero(pcbddc->benign_p0,pcbddc->benign_n*sizeof(PetscScalar));CHKERRQ(ierr); 857dc359a40SStefano Zampini ierr = PCBDDCApplyInterfacePreconditioner(mat_ctx->pc,PETSC_FALSE);CHKERRQ(ierr); 858c7ffc8ceSStefano Zampini ierr = PetscMemzero(pcbddc->benign_p0,pcbddc->benign_n*sizeof(PetscScalar));CHKERRQ(ierr); 859af140850Sstefano_zampini ierr = VecSet(y,0.0);CHKERRQ(ierr); 860674ae819SStefano Zampini /* Application of B_delta */ 861674ae819SStefano Zampini ierr = MatMult(mat_ctx->B_delta,pcis->vec1_B,mat_ctx->lambda_local);CHKERRQ(ierr); 862af140850Sstefano_zampini /* Contribution from boundary pressures */ 863af140850Sstefano_zampini if (mat_ctx->C) { 864af140850Sstefano_zampini const PetscScalar *lx; 865af140850Sstefano_zampini PetscScalar *ly; 866af140850Sstefano_zampini 867af140850Sstefano_zampini /* pressures ordered first in x and y */ 868af140850Sstefano_zampini ierr = VecGetArrayRead(x,&lx);CHKERRQ(ierr); 869af140850Sstefano_zampini ierr = VecGetArray(y,&ly);CHKERRQ(ierr); 870af140850Sstefano_zampini ierr = VecPlaceArray(mat_ctx->xPg,lx);CHKERRQ(ierr); 871af140850Sstefano_zampini ierr = VecPlaceArray(mat_ctx->yPg,ly);CHKERRQ(ierr); 872af140850Sstefano_zampini ierr = MatMult(mat_ctx->C,mat_ctx->xPg,mat_ctx->yPg);CHKERRQ(ierr); 873af140850Sstefano_zampini ierr = VecResetArray(mat_ctx->xPg);CHKERRQ(ierr); 874af140850Sstefano_zampini ierr = VecResetArray(mat_ctx->yPg);CHKERRQ(ierr); 875af140850Sstefano_zampini ierr = VecRestoreArrayRead(x,&lx);CHKERRQ(ierr); 876af140850Sstefano_zampini ierr = VecRestoreArray(y,&ly);CHKERRQ(ierr); 877af140850Sstefano_zampini } 878af140850Sstefano_zampini /* Add contribution from saddle point */ 879af140850Sstefano_zampini if (mat_ctx->l2g_p) { 880af140850Sstefano_zampini ierr = MatMult(mat_ctx->B_BB,pcis->vec1_B,mat_ctx->vP);CHKERRQ(ierr); 881af140850Sstefano_zampini if (pcbddc->switch_static) { 882af140850Sstefano_zampini ierr = MatMultAdd(mat_ctx->B_BI,pcis->vec1_D,mat_ctx->vP,mat_ctx->vP);CHKERRQ(ierr); 883af140850Sstefano_zampini } 884af140850Sstefano_zampini ierr = VecScatterBegin(mat_ctx->l2g_p,mat_ctx->vP,y,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 885af140850Sstefano_zampini ierr = VecScatterEnd(mat_ctx->l2g_p,mat_ctx->vP,y,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 886af140850Sstefano_zampini } 887674ae819SStefano Zampini ierr = VecScatterBegin(mat_ctx->l2g_lambda,mat_ctx->lambda_local,y,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 888674ae819SStefano Zampini ierr = VecScatterEnd(mat_ctx->l2g_lambda,mat_ctx->lambda_local,y,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 889674ae819SStefano Zampini PetscFunctionReturn(0); 890674ae819SStefano Zampini } 891674ae819SStefano Zampini 892674ae819SStefano Zampini #undef __FUNCT__ 893edf7251bSStefano Zampini #define __FUNCT__ "FETIDPMatMultTranspose" 894edf7251bSStefano Zampini PetscErrorCode FETIDPMatMultTranspose(Mat fetimat, Vec x, Vec y) 895edf7251bSStefano Zampini { 896edf7251bSStefano Zampini FETIDPMat_ctx mat_ctx; 897edf7251bSStefano Zampini PC_IS *pcis; 898edf7251bSStefano Zampini PetscErrorCode ierr; 899edf7251bSStefano Zampini 900edf7251bSStefano Zampini PetscFunctionBegin; 901edf7251bSStefano Zampini ierr = MatShellGetContext(fetimat,(void**)&mat_ctx);CHKERRQ(ierr); 902edf7251bSStefano Zampini pcis = (PC_IS*)mat_ctx->pc->data; 903edf7251bSStefano Zampini /* Application of B_delta^T */ 904edf7251bSStefano Zampini ierr = VecScatterBegin(mat_ctx->l2g_lambda,x,mat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 905edf7251bSStefano Zampini ierr = VecScatterEnd(mat_ctx->l2g_lambda,x,mat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 906edf7251bSStefano Zampini ierr = MatMultTranspose(mat_ctx->B_delta,mat_ctx->lambda_local,pcis->vec1_B);CHKERRQ(ierr); 907edf7251bSStefano Zampini /* Application of \widetilde{S}^-1 */ 908edf7251bSStefano Zampini ierr = VecSet(pcis->vec1_D,0.0);CHKERRQ(ierr); 909edf7251bSStefano Zampini ierr = PCBDDCApplyInterfacePreconditioner(mat_ctx->pc,PETSC_TRUE);CHKERRQ(ierr); 910edf7251bSStefano Zampini /* Application of B_delta */ 911edf7251bSStefano Zampini ierr = MatMult(mat_ctx->B_delta,pcis->vec1_B,mat_ctx->lambda_local);CHKERRQ(ierr); 912edf7251bSStefano Zampini ierr = VecSet(y,0.0);CHKERRQ(ierr); 913edf7251bSStefano Zampini ierr = VecScatterBegin(mat_ctx->l2g_lambda,mat_ctx->lambda_local,y,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 914edf7251bSStefano Zampini ierr = VecScatterEnd(mat_ctx->l2g_lambda,mat_ctx->lambda_local,y,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 915edf7251bSStefano Zampini PetscFunctionReturn(0); 916edf7251bSStefano Zampini } 917edf7251bSStefano Zampini 918edf7251bSStefano Zampini #undef __FUNCT__ 919674ae819SStefano Zampini #define __FUNCT__ "FETIDPPCApply" 920674ae819SStefano Zampini PetscErrorCode FETIDPPCApply(PC fetipc, Vec x, Vec y) 921674ae819SStefano Zampini { 922674ae819SStefano Zampini FETIDPPC_ctx pc_ctx; 923674ae819SStefano Zampini PC_IS *pcis; 924674ae819SStefano Zampini PetscErrorCode ierr; 925674ae819SStefano Zampini 926674ae819SStefano Zampini PetscFunctionBegin; 927302440fdSBarry Smith ierr = PCShellGetContext(fetipc,(void**)&pc_ctx);CHKERRQ(ierr); 928674ae819SStefano Zampini pcis = (PC_IS*)pc_ctx->pc->data; 929674ae819SStefano Zampini /* Application of B_Ddelta^T */ 930674ae819SStefano Zampini ierr = VecScatterBegin(pc_ctx->l2g_lambda,x,pc_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 931674ae819SStefano Zampini ierr = VecScatterEnd(pc_ctx->l2g_lambda,x,pc_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 932674ae819SStefano Zampini ierr = VecSet(pcis->vec2_B,0.0);CHKERRQ(ierr); 933674ae819SStefano Zampini ierr = MatMultTranspose(pc_ctx->B_Ddelta,pc_ctx->lambda_local,pcis->vec2_B);CHKERRQ(ierr); 934ed6c3d69SStefano Zampini /* Application of local Schur complement */ 935ed6c3d69SStefano Zampini ierr = MatMult(pc_ctx->S_j,pcis->vec2_B,pcis->vec1_B);CHKERRQ(ierr); 936edf7251bSStefano Zampini /* Application of B_Ddelta */ 937edf7251bSStefano Zampini ierr = MatMult(pc_ctx->B_Ddelta,pcis->vec1_B,pc_ctx->lambda_local);CHKERRQ(ierr); 938edf7251bSStefano Zampini ierr = VecSet(y,0.0);CHKERRQ(ierr); 939edf7251bSStefano Zampini ierr = VecScatterBegin(pc_ctx->l2g_lambda,pc_ctx->lambda_local,y,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 940edf7251bSStefano Zampini ierr = VecScatterEnd(pc_ctx->l2g_lambda,pc_ctx->lambda_local,y,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 941b519380fSstefano_zampini /* interface pressure preconditioner */ 942b519380fSstefano_zampini if (pc_ctx->kP) { 943b519380fSstefano_zampini const PetscScalar *lx; 944b519380fSstefano_zampini PetscScalar *ly; 945b519380fSstefano_zampini 946b519380fSstefano_zampini /* pressures ordered first in x and y */ 947b519380fSstefano_zampini ierr = VecGetArrayRead(x,&lx);CHKERRQ(ierr); 948b519380fSstefano_zampini ierr = VecGetArray(y,&ly);CHKERRQ(ierr); 949b519380fSstefano_zampini ierr = VecPlaceArray(pc_ctx->xPg,lx);CHKERRQ(ierr); 950b519380fSstefano_zampini ierr = VecPlaceArray(pc_ctx->yPg,ly);CHKERRQ(ierr); 951b519380fSstefano_zampini ierr = KSPSolve(pc_ctx->kP,pc_ctx->xPg,pc_ctx->yPg);CHKERRQ(ierr); 952b519380fSstefano_zampini ierr = VecResetArray(pc_ctx->xPg);CHKERRQ(ierr); 953b519380fSstefano_zampini ierr = VecResetArray(pc_ctx->yPg);CHKERRQ(ierr); 954b519380fSstefano_zampini ierr = VecRestoreArrayRead(x,&lx);CHKERRQ(ierr); 955b519380fSstefano_zampini ierr = VecRestoreArray(y,&ly);CHKERRQ(ierr); 956b519380fSstefano_zampini } 957edf7251bSStefano Zampini PetscFunctionReturn(0); 958edf7251bSStefano Zampini } 959edf7251bSStefano Zampini 960edf7251bSStefano Zampini #undef __FUNCT__ 961edf7251bSStefano Zampini #define __FUNCT__ "FETIDPPCApplyTranspose" 962edf7251bSStefano Zampini PetscErrorCode FETIDPPCApplyTranspose(PC fetipc, Vec x, Vec y) 963edf7251bSStefano Zampini { 964edf7251bSStefano Zampini FETIDPPC_ctx pc_ctx; 965edf7251bSStefano Zampini PC_IS *pcis; 966edf7251bSStefano Zampini PetscErrorCode ierr; 967edf7251bSStefano Zampini 968edf7251bSStefano Zampini PetscFunctionBegin; 969302440fdSBarry Smith ierr = PCShellGetContext(fetipc,(void**)&pc_ctx);CHKERRQ(ierr); 970edf7251bSStefano Zampini pcis = (PC_IS*)pc_ctx->pc->data; 971edf7251bSStefano Zampini /* Application of B_Ddelta^T */ 972edf7251bSStefano Zampini ierr = VecScatterBegin(pc_ctx->l2g_lambda,x,pc_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 973edf7251bSStefano Zampini ierr = VecScatterEnd(pc_ctx->l2g_lambda,x,pc_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 974edf7251bSStefano Zampini ierr = VecSet(pcis->vec2_B,0.0);CHKERRQ(ierr); 975edf7251bSStefano Zampini ierr = MatMultTranspose(pc_ctx->B_Ddelta,pc_ctx->lambda_local,pcis->vec2_B);CHKERRQ(ierr); 976ed6c3d69SStefano Zampini /* Application of local Schur complement */ 977ed6c3d69SStefano Zampini ierr = MatMultTranspose(pc_ctx->S_j,pcis->vec2_B,pcis->vec1_B);CHKERRQ(ierr); 978674ae819SStefano Zampini /* Application of B_Ddelta */ 979674ae819SStefano Zampini ierr = MatMult(pc_ctx->B_Ddelta,pcis->vec1_B,pc_ctx->lambda_local);CHKERRQ(ierr); 980674ae819SStefano Zampini ierr = VecSet(y,0.0);CHKERRQ(ierr); 981674ae819SStefano Zampini ierr = VecScatterBegin(pc_ctx->l2g_lambda,pc_ctx->lambda_local,y,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 982674ae819SStefano Zampini ierr = VecScatterEnd(pc_ctx->l2g_lambda,pc_ctx->lambda_local,y,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 983674ae819SStefano Zampini PetscFunctionReturn(0); 984674ae819SStefano Zampini } 985c45b8d2dSstefano_zampini 986c45b8d2dSstefano_zampini #undef __FUNCT__ 987c45b8d2dSstefano_zampini #define __FUNCT__ "FETIDPPCView" 988c45b8d2dSstefano_zampini PetscErrorCode FETIDPPCView(PC pc, PetscViewer viewer) 989c45b8d2dSstefano_zampini { 990c45b8d2dSstefano_zampini FETIDPPC_ctx pc_ctx; 991c45b8d2dSstefano_zampini PetscBool iascii; 992c45b8d2dSstefano_zampini PetscViewer sviewer; 993c45b8d2dSstefano_zampini PetscErrorCode ierr; 994c45b8d2dSstefano_zampini 995c45b8d2dSstefano_zampini PetscFunctionBegin; 996c45b8d2dSstefano_zampini ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERASCII,&iascii);CHKERRQ(ierr); 997c45b8d2dSstefano_zampini if (iascii) { 998c45b8d2dSstefano_zampini PetscMPIInt rank; 999*25d06dbeSstefano_zampini PetscBool isschur,isshell; 1000c45b8d2dSstefano_zampini 1001c45b8d2dSstefano_zampini ierr = PCShellGetContext(pc,(void**)&pc_ctx);CHKERRQ(ierr); 1002c45b8d2dSstefano_zampini ierr = MPI_Comm_rank(PetscObjectComm((PetscObject)pc),&rank);CHKERRQ(ierr); 1003c45b8d2dSstefano_zampini ierr = PetscObjectTypeCompare((PetscObject)pc_ctx->S_j,MATSCHURCOMPLEMENT,&isschur);CHKERRQ(ierr); 1004c45b8d2dSstefano_zampini if (isschur) { 1005c45b8d2dSstefano_zampini ierr = PetscViewerASCIIPrintf(viewer," FETI-DP multipliers Dirichlet preconditioner (just from rank 0)\n");CHKERRQ(ierr); 1006c45b8d2dSstefano_zampini } else { 1007c45b8d2dSstefano_zampini ierr = PetscViewerASCIIPrintf(viewer," FETI-DP multipliers Lumped preconditioner (just from rank 0)\n");CHKERRQ(ierr); 1008c45b8d2dSstefano_zampini } 1009c45b8d2dSstefano_zampini ierr = PetscViewerGetSubViewer(viewer,PetscObjectComm((PetscObject)pc_ctx->S_j),&sviewer);CHKERRQ(ierr); 1010c45b8d2dSstefano_zampini if (!rank) { 1011c45b8d2dSstefano_zampini ierr = PetscViewerPushFormat(sviewer,PETSC_VIEWER_ASCII_INFO);CHKERRQ(ierr); 1012c45b8d2dSstefano_zampini ierr = PetscViewerASCIIAddTab(sviewer,2);CHKERRQ(ierr); 1013c45b8d2dSstefano_zampini ierr = MatView(pc_ctx->S_j,sviewer);CHKERRQ(ierr); 1014c45b8d2dSstefano_zampini ierr = PetscViewerASCIISubtractTab(sviewer,2);CHKERRQ(ierr); 1015c45b8d2dSstefano_zampini ierr = PetscViewerPopFormat(sviewer);CHKERRQ(ierr); 1016c45b8d2dSstefano_zampini } 1017*25d06dbeSstefano_zampini ierr = PetscObjectTypeCompare((PetscObject)pc_ctx->B_Ddelta,MATSHELL,&isshell);CHKERRQ(ierr); 1018*25d06dbeSstefano_zampini if (isshell) { 1019*25d06dbeSstefano_zampini BDdelta_DN ctx; 1020*25d06dbeSstefano_zampini ierr = PetscViewerASCIIPrintf(viewer," FETI-DP BDdelta: DB^t * (B D^-1 B^t)^-1 for deluxe scaling (just from rank 0)\n");CHKERRQ(ierr); 1021*25d06dbeSstefano_zampini ierr = MatShellGetContext(pc_ctx->B_Ddelta,&ctx);CHKERRQ(ierr); 1022*25d06dbeSstefano_zampini if (!rank) { 1023*25d06dbeSstefano_zampini ierr = PetscViewerASCIIAddTab(sviewer,2);CHKERRQ(ierr); 1024*25d06dbeSstefano_zampini ierr = KSPView(ctx->kBD,sviewer);CHKERRQ(ierr); 1025*25d06dbeSstefano_zampini ierr = PetscViewerPushFormat(sviewer,PETSC_VIEWER_ASCII_INFO);CHKERRQ(ierr); 1026*25d06dbeSstefano_zampini ierr = MatView(ctx->BD,sviewer);CHKERRQ(ierr); 1027*25d06dbeSstefano_zampini ierr = PetscViewerASCIISubtractTab(sviewer,2);CHKERRQ(ierr); 1028*25d06dbeSstefano_zampini ierr = PetscViewerPopFormat(sviewer);CHKERRQ(ierr); 1029*25d06dbeSstefano_zampini } 1030*25d06dbeSstefano_zampini } 1031c45b8d2dSstefano_zampini ierr = PetscViewerRestoreSubViewer(viewer,PetscObjectComm((PetscObject)pc_ctx->S_j),&sviewer);CHKERRQ(ierr); 1032c45b8d2dSstefano_zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 1033c45b8d2dSstefano_zampini if (pc_ctx->kP) { 1034c45b8d2dSstefano_zampini ierr = PetscViewerASCIIPrintf(viewer," FETI-DP pressure preconditioner\n");CHKERRQ(ierr); 1035c45b8d2dSstefano_zampini ierr = PetscViewerASCIIAddTab(viewer,2);CHKERRQ(ierr); 1036c45b8d2dSstefano_zampini ierr = KSPView(pc_ctx->kP,viewer);CHKERRQ(ierr); 1037c45b8d2dSstefano_zampini ierr = PetscViewerASCIISubtractTab(viewer,2);CHKERRQ(ierr); 1038c45b8d2dSstefano_zampini } 1039c45b8d2dSstefano_zampini } 1040c45b8d2dSstefano_zampini PetscFunctionReturn(0); 1041c45b8d2dSstefano_zampini } 1042