1ab5c6b0cSJed Brown #include <../src/ksp/pc/impls/bddc/bddc.h> 2ab5c6b0cSJed Brown #include <../src/ksp/pc/impls/bddc/bddcprivate.h> 3674ae819SStefano Zampini 434a97f8cSStefano Zampini /* prototypes for deluxe functions */ 534a97f8cSStefano Zampini static PetscErrorCode PCBDDCScalingCreate_Deluxe(PC); 634a97f8cSStefano Zampini static PetscErrorCode PCBDDCScalingDestroy_Deluxe(PC); 734a97f8cSStefano Zampini static PetscErrorCode PCBDDCScalingSetUp_Deluxe(PC); 834a97f8cSStefano Zampini static PetscErrorCode PCBDDCScalingSetUp_Deluxe_Par(PC,PetscInt,PetscInt,PetscInt[],PetscInt[]); 9883469d8SStefano Zampini static PetscErrorCode PCBDDCScalingSetUp_Deluxe_Seq(PC); 1034a97f8cSStefano Zampini static PetscErrorCode PCBDDCScalingReset_Deluxe_Solvers(PCBDDCDeluxeScaling); 11674ae819SStefano Zampini 12674ae819SStefano Zampini #undef __FUNCT__ 13674ae819SStefano Zampini #define __FUNCT__ "PCBDDCScalingExtension_Basic" 14674ae819SStefano Zampini static PetscErrorCode PCBDDCScalingExtension_Basic(PC pc, Vec local_interface_vector, Vec global_vector) 15674ae819SStefano Zampini { 16674ae819SStefano Zampini PC_IS* pcis = (PC_IS*)pc->data; 17674ae819SStefano Zampini PC_BDDC* pcbddc = (PC_BDDC*)pc->data; 18674ae819SStefano Zampini PetscErrorCode ierr; 19674ae819SStefano Zampini 20674ae819SStefano Zampini PetscFunctionBegin; 21674ae819SStefano Zampini /* Apply partition of unity */ 22674ae819SStefano Zampini ierr = VecPointwiseMult(pcbddc->work_scaling,pcis->D,local_interface_vector);CHKERRQ(ierr); 23674ae819SStefano Zampini ierr = VecSet(global_vector,0.0);CHKERRQ(ierr); 24674ae819SStefano Zampini ierr = VecScatterBegin(pcis->global_to_B,pcbddc->work_scaling,global_vector,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 25674ae819SStefano Zampini ierr = VecScatterEnd(pcis->global_to_B,pcbddc->work_scaling,global_vector,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 26674ae819SStefano Zampini PetscFunctionReturn(0); 27674ae819SStefano Zampini } 28674ae819SStefano Zampini 29674ae819SStefano Zampini #undef __FUNCT__ 30674ae819SStefano Zampini #define __FUNCT__ "PCBDDCScalingExtension_Deluxe" 31674ae819SStefano Zampini static PetscErrorCode PCBDDCScalingExtension_Deluxe(PC pc, Vec x, Vec y) 32674ae819SStefano Zampini { 33674ae819SStefano Zampini PC_IS* pcis=(PC_IS*)pc->data; 34674ae819SStefano Zampini PC_BDDC* pcbddc=(PC_BDDC*)pc->data; 35674ae819SStefano Zampini PCBDDCDeluxeScaling deluxe_ctx = pcbddc->deluxe_ctx; 36b96c3477SStefano Zampini PCBDDCSubSchurs sub_schurs = pcbddc->sub_schurs; 37674ae819SStefano Zampini PetscInt i; 38674ae819SStefano Zampini PetscErrorCode ierr; 39674ae819SStefano Zampini 40674ae819SStefano Zampini /* TODO CHECK STUFF RELATED WITH FAKE WORK */ 41674ae819SStefano Zampini PetscFunctionBegin; 4234a97f8cSStefano Zampini ierr = VecSet(pcbddc->work_scaling,0.0);CHKERRQ(ierr); /* needed by the fake work below */ 4334a97f8cSStefano Zampini if (deluxe_ctx->n_simple) { 44674ae819SStefano Zampini /* scale deluxe vertices using diagonal scaling */ 452b095fd8SStefano Zampini const PetscScalar *array_x,*array_D; 462b095fd8SStefano Zampini PetscScalar *array; 472b095fd8SStefano Zampini ierr = VecGetArrayRead(x,&array_x);CHKERRQ(ierr); 482b095fd8SStefano Zampini ierr = VecGetArrayRead(pcis->D,&array_D);CHKERRQ(ierr); 49674ae819SStefano Zampini ierr = VecGetArray(pcbddc->work_scaling,&array);CHKERRQ(ierr); 50674ae819SStefano Zampini for (i=0;i<deluxe_ctx->n_simple;i++) { 51674ae819SStefano Zampini array[deluxe_ctx->idx_simple_B[i]] = array_x[deluxe_ctx->idx_simple_B[i]]*array_D[deluxe_ctx->idx_simple_B[i]]; 52674ae819SStefano Zampini } 53674ae819SStefano Zampini ierr = VecRestoreArray(pcbddc->work_scaling,&array);CHKERRQ(ierr); 542b095fd8SStefano Zampini ierr = VecRestoreArrayRead(pcis->D,&array_D);CHKERRQ(ierr); 552b095fd8SStefano Zampini ierr = VecRestoreArrayRead(x,&array_x);CHKERRQ(ierr); 5634a97f8cSStefano Zampini } 5734a97f8cSStefano Zampini /* sequential part : all problems and Schur applications collapsed into a single matrix vector multiplication and ksp solution */ 5841c3ba1bSStefano Zampini if (deluxe_ctx->seq_ksp) { 59674ae819SStefano Zampini ierr = VecScatterBegin(deluxe_ctx->seq_scctx,x,deluxe_ctx->seq_work1,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 60674ae819SStefano Zampini ierr = VecScatterEnd(deluxe_ctx->seq_scctx,x,deluxe_ctx->seq_work1,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 611d850880SStefano Zampini ierr = MatMultTranspose(sub_schurs->S_Ej_all,deluxe_ctx->seq_work1,deluxe_ctx->seq_work2);CHKERRQ(ierr); 621d850880SStefano Zampini ierr = KSPSolveTranspose(deluxe_ctx->seq_ksp,deluxe_ctx->seq_work2,deluxe_ctx->seq_work1);CHKERRQ(ierr); 63674ae819SStefano Zampini /* fake work due to final ADD VALUES and vertices scaling needed? TODO: check it */ 64674ae819SStefano Zampini ierr = VecScatterBegin(deluxe_ctx->seq_scctx,deluxe_ctx->seq_work1,pcbddc->work_scaling,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 65674ae819SStefano Zampini ierr = VecScatterEnd(deluxe_ctx->seq_scctx,deluxe_ctx->seq_work1,pcbddc->work_scaling,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 66674ae819SStefano Zampini } 67674ae819SStefano Zampini /* parallel part */ 68674ae819SStefano Zampini for (i=0;i<deluxe_ctx->par_colors;i++) { 69674ae819SStefano Zampini if (deluxe_ctx->par_ksp[i]) { 7034a97f8cSStefano Zampini PetscMPIInt color_rank; 7134a97f8cSStefano Zampini PetscInt subidx = deluxe_ctx->par_col2sub[i]; 7234a97f8cSStefano Zampini /* restrict on subset */ 73b96c3477SStefano Zampini ierr = VecScatterBegin(deluxe_ctx->par_scctx_s[i],x,deluxe_ctx->par_work1[i],INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 74b96c3477SStefano Zampini ierr = VecScatterEnd(deluxe_ctx->par_scctx_s[i],x,deluxe_ctx->par_work1[i],INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 7534a97f8cSStefano Zampini /* S_Ej */ 76b96c3477SStefano Zampini ierr = MatMult(sub_schurs->S_Ej[subidx],deluxe_ctx->par_work1[i],deluxe_ctx->par_work2[i]);CHKERRQ(ierr); 7734a97f8cSStefano Zampini /* (\sum_j S_Ej)^-1 */ 7834a97f8cSStefano Zampini ierr = VecSet(deluxe_ctx->par_vec[i],0.0);CHKERRQ(ierr); 79b96c3477SStefano Zampini ierr = VecScatterBegin(deluxe_ctx->par_scctx_p[i],deluxe_ctx->par_work2[i],deluxe_ctx->par_vec[i],ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 80b96c3477SStefano Zampini ierr = VecScatterEnd(deluxe_ctx->par_scctx_p[i],deluxe_ctx->par_work2[i],deluxe_ctx->par_vec[i],ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 81674ae819SStefano Zampini ierr = KSPSolve(deluxe_ctx->par_ksp[i],deluxe_ctx->par_vec[i],deluxe_ctx->par_vec[i]);CHKERRQ(ierr); 8234a97f8cSStefano Zampini ierr = MPI_Comm_rank(PetscObjectComm((PetscObject)deluxe_ctx->par_ksp[i]),&color_rank);CHKERRQ(ierr); 8334a97f8cSStefano Zampini /* get back solution on subset */ 84b96c3477SStefano Zampini ierr = VecScatterBegin(deluxe_ctx->par_scctx_p[i],deluxe_ctx->par_vec[i],deluxe_ctx->par_work1[i],INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 85b96c3477SStefano Zampini ierr = VecScatterEnd(deluxe_ctx->par_scctx_p[i],deluxe_ctx->par_vec[i],deluxe_ctx->par_work1[i],INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 8634a97f8cSStefano Zampini if (!color_rank) { /* only the master process in coloured comm copies the computed values */ 87b96c3477SStefano Zampini ierr = VecScatterBegin(deluxe_ctx->par_scctx_s[i],deluxe_ctx->par_work1[i],pcbddc->work_scaling,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 88b96c3477SStefano Zampini ierr = VecScatterEnd(deluxe_ctx->par_scctx_s[i],deluxe_ctx->par_work1[i],pcbddc->work_scaling,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 89674ae819SStefano Zampini } 90674ae819SStefano Zampini } 91674ae819SStefano Zampini } 92674ae819SStefano Zampini /* put local boundary part in global vector */ 9334a97f8cSStefano Zampini ierr = VecSet(y,0.0);CHKERRQ(ierr); 94674ae819SStefano Zampini ierr = VecScatterBegin(pcis->global_to_B,pcbddc->work_scaling,y,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 95674ae819SStefano Zampini ierr = VecScatterEnd(pcis->global_to_B,pcbddc->work_scaling,y,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 96674ae819SStefano Zampini PetscFunctionReturn(0); 97674ae819SStefano Zampini } 98674ae819SStefano Zampini 99674ae819SStefano Zampini #undef __FUNCT__ 100674ae819SStefano Zampini #define __FUNCT__ "PCBDDCScalingExtension" 101674ae819SStefano Zampini PetscErrorCode PCBDDCScalingExtension(PC pc, Vec local_interface_vector, Vec global_vector) 102674ae819SStefano Zampini { 103674ae819SStefano Zampini PC_BDDC *pcbddc=(PC_BDDC*)pc->data; 104674ae819SStefano Zampini PetscErrorCode ierr; 105674ae819SStefano Zampini 106674ae819SStefano Zampini PetscFunctionBegin; 107674ae819SStefano Zampini PetscValidHeaderSpecific(pc,PC_CLASSID,1); 108674ae819SStefano Zampini PetscValidHeaderSpecific(local_interface_vector,VEC_CLASSID,2); 109674ae819SStefano Zampini PetscValidHeaderSpecific(global_vector,VEC_CLASSID,3); 110674ae819SStefano Zampini if (local_interface_vector == pcbddc->work_scaling) { 111674ae819SStefano Zampini SETERRQ(PETSC_COMM_WORLD,PETSC_ERR_SUP,"Local vector cannot be pcbddc->work_scaling!\n"); 112674ae819SStefano Zampini } 113674ae819SStefano Zampini ierr = PetscTryMethod(pc,"PCBDDCScalingExtension_C",(PC,Vec,Vec),(pc,local_interface_vector,global_vector));CHKERRQ(ierr); 114674ae819SStefano Zampini PetscFunctionReturn(0); 115674ae819SStefano Zampini } 116674ae819SStefano Zampini 117674ae819SStefano Zampini #undef __FUNCT__ 118674ae819SStefano Zampini #define __FUNCT__ "PCBDDCScalingRestriction_Basic" 119674ae819SStefano Zampini static PetscErrorCode PCBDDCScalingRestriction_Basic(PC pc, Vec global_vector, Vec local_interface_vector) 120674ae819SStefano Zampini { 121674ae819SStefano Zampini PetscErrorCode ierr; 122674ae819SStefano Zampini PC_IS* pcis = (PC_IS*)pc->data; 123674ae819SStefano Zampini 124674ae819SStefano Zampini PetscFunctionBegin; 125674ae819SStefano Zampini ierr = VecScatterBegin(pcis->global_to_B,global_vector,local_interface_vector,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 126674ae819SStefano Zampini ierr = VecScatterEnd(pcis->global_to_B,global_vector,local_interface_vector,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 127674ae819SStefano Zampini /* Apply partition of unity */ 128674ae819SStefano Zampini ierr = VecPointwiseMult(local_interface_vector,pcis->D,local_interface_vector);CHKERRQ(ierr); 129674ae819SStefano Zampini PetscFunctionReturn(0); 130674ae819SStefano Zampini } 131674ae819SStefano Zampini 132674ae819SStefano Zampini #undef __FUNCT__ 133674ae819SStefano Zampini #define __FUNCT__ "PCBDDCScalingRestriction_Deluxe" 134674ae819SStefano Zampini static PetscErrorCode PCBDDCScalingRestriction_Deluxe(PC pc, Vec x, Vec y) 135674ae819SStefano Zampini { 136674ae819SStefano Zampini PC_IS* pcis=(PC_IS*)pc->data; 137674ae819SStefano Zampini PC_BDDC* pcbddc=(PC_BDDC*)pc->data; 138674ae819SStefano Zampini PCBDDCDeluxeScaling deluxe_ctx = pcbddc->deluxe_ctx; 139b96c3477SStefano Zampini PCBDDCSubSchurs sub_schurs = pcbddc->sub_schurs; 140674ae819SStefano Zampini PetscInt i; 141674ae819SStefano Zampini PetscErrorCode ierr; 142674ae819SStefano Zampini 143674ae819SStefano Zampini PetscFunctionBegin; 144674ae819SStefano Zampini /* get local boundary part of global vector */ 145674ae819SStefano Zampini ierr = VecScatterBegin(pcis->global_to_B,x,y,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 146674ae819SStefano Zampini ierr = VecScatterEnd(pcis->global_to_B,x,y,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 14734a97f8cSStefano Zampini if (deluxe_ctx->n_simple) { 14834a97f8cSStefano Zampini /* scale deluxe vertices using diagonal scaling */ 1492b095fd8SStefano Zampini PetscScalar *array_y; 1502b095fd8SStefano Zampini const PetscScalar *array_D; 151674ae819SStefano Zampini ierr = VecGetArray(y,&array_y);CHKERRQ(ierr); 1522b095fd8SStefano Zampini ierr = VecGetArrayRead(pcis->D,&array_D);CHKERRQ(ierr); 153674ae819SStefano Zampini for (i=0;i<deluxe_ctx->n_simple;i++) { 154674ae819SStefano Zampini array_y[deluxe_ctx->idx_simple_B[i]] *= array_D[deluxe_ctx->idx_simple_B[i]]; 155674ae819SStefano Zampini } 1562b095fd8SStefano Zampini ierr = VecRestoreArrayRead(pcis->D,&array_D);CHKERRQ(ierr); 157674ae819SStefano Zampini ierr = VecRestoreArray(y,&array_y);CHKERRQ(ierr); 15834a97f8cSStefano Zampini } 15934a97f8cSStefano Zampini /* sequential part : all problems and Schur applications collapsed into a single matrix vector multiplication and ksp solution */ 16041c3ba1bSStefano Zampini if (deluxe_ctx->seq_ksp) { 161674ae819SStefano Zampini ierr = VecScatterBegin(deluxe_ctx->seq_scctx,y,deluxe_ctx->seq_work1,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 162674ae819SStefano Zampini ierr = VecScatterEnd(deluxe_ctx->seq_scctx,y,deluxe_ctx->seq_work1,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 1631d850880SStefano Zampini ierr = KSPSolve(deluxe_ctx->seq_ksp,deluxe_ctx->seq_work1,deluxe_ctx->seq_work2);CHKERRQ(ierr); 1641d850880SStefano Zampini ierr = MatMult(sub_schurs->S_Ej_all,deluxe_ctx->seq_work2,deluxe_ctx->seq_work1);CHKERRQ(ierr); 165674ae819SStefano Zampini ierr = VecScatterBegin(deluxe_ctx->seq_scctx,deluxe_ctx->seq_work1,y,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 166674ae819SStefano Zampini ierr = VecScatterEnd(deluxe_ctx->seq_scctx,deluxe_ctx->seq_work1,y,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 167674ae819SStefano Zampini } 168674ae819SStefano Zampini /* parallel part */ 169674ae819SStefano Zampini for (i=0;i<deluxe_ctx->par_colors;i++) { 170674ae819SStefano Zampini if (deluxe_ctx->par_ksp[i]) { 17134a97f8cSStefano Zampini PetscInt subidx = deluxe_ctx->par_col2sub[i]; 17234a97f8cSStefano Zampini /* restrict on subset */ 173b96c3477SStefano Zampini ierr = VecScatterBegin(deluxe_ctx->par_scctx_s[i],y,deluxe_ctx->par_work1[i],INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 174b96c3477SStefano Zampini ierr = VecScatterEnd(deluxe_ctx->par_scctx_s[i],y,deluxe_ctx->par_work1[i],INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 17534a97f8cSStefano Zampini /* (\sum_j S_Ej)^-T */ 17634a97f8cSStefano Zampini ierr = VecSet(deluxe_ctx->par_vec[i],0.0);CHKERRQ(ierr); 177b96c3477SStefano Zampini ierr = VecScatterBegin(deluxe_ctx->par_scctx_p[i],deluxe_ctx->par_work1[i],deluxe_ctx->par_vec[i],INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 178b96c3477SStefano Zampini ierr = VecScatterEnd(deluxe_ctx->par_scctx_p[i],deluxe_ctx->par_work1[i],deluxe_ctx->par_vec[i],INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 179674ae819SStefano Zampini ierr = KSPSolveTranspose(deluxe_ctx->par_ksp[i],deluxe_ctx->par_vec[i],deluxe_ctx->par_vec[i]);CHKERRQ(ierr); 180b96c3477SStefano Zampini ierr = VecScatterBegin(deluxe_ctx->par_scctx_p[i],deluxe_ctx->par_vec[i],deluxe_ctx->par_work1[i],INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 181b96c3477SStefano Zampini ierr = VecScatterEnd(deluxe_ctx->par_scctx_p[i],deluxe_ctx->par_vec[i],deluxe_ctx->par_work1[i],INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 18234a97f8cSStefano Zampini /* S_Ej^T */ 183b96c3477SStefano Zampini ierr = MatMultTranspose(sub_schurs->S_Ej[subidx],deluxe_ctx->par_work1[i],deluxe_ctx->par_work2[i]);CHKERRQ(ierr); 18434a97f8cSStefano Zampini /* extend to boundary */ 185b96c3477SStefano Zampini ierr = VecScatterBegin(deluxe_ctx->par_scctx_s[i],deluxe_ctx->par_work2[i],y,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 186b96c3477SStefano Zampini ierr = VecScatterEnd(deluxe_ctx->par_scctx_s[i],deluxe_ctx->par_work2[i],y,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 187674ae819SStefano Zampini } 188674ae819SStefano Zampini } 189674ae819SStefano Zampini PetscFunctionReturn(0); 190674ae819SStefano Zampini } 191674ae819SStefano Zampini 192674ae819SStefano Zampini #undef __FUNCT__ 193674ae819SStefano Zampini #define __FUNCT__ "PCBDDCScalingRestriction" 194674ae819SStefano Zampini PetscErrorCode PCBDDCScalingRestriction(PC pc, Vec global_vector, Vec local_interface_vector) 195674ae819SStefano Zampini { 196674ae819SStefano Zampini PC_BDDC *pcbddc=(PC_BDDC*)pc->data; 197674ae819SStefano Zampini PetscErrorCode ierr; 198674ae819SStefano Zampini 199674ae819SStefano Zampini PetscFunctionBegin; 200674ae819SStefano Zampini PetscValidHeaderSpecific(pc,PC_CLASSID,1); 201674ae819SStefano Zampini PetscValidHeaderSpecific(global_vector,VEC_CLASSID,2); 202674ae819SStefano Zampini PetscValidHeaderSpecific(local_interface_vector,VEC_CLASSID,3); 203674ae819SStefano Zampini if (local_interface_vector == pcbddc->work_scaling) { 204674ae819SStefano Zampini SETERRQ(PETSC_COMM_WORLD,PETSC_ERR_SUP,"Local vector should cannot be pcbddc->work_scaling!\n"); 205674ae819SStefano Zampini } 206674ae819SStefano Zampini ierr = PetscTryMethod(pc,"PCBDDCScalingRestriction_C",(PC,Vec,Vec),(pc,global_vector,local_interface_vector));CHKERRQ(ierr); 207674ae819SStefano Zampini PetscFunctionReturn(0); 208674ae819SStefano Zampini } 209674ae819SStefano Zampini 210674ae819SStefano Zampini #undef __FUNCT__ 211674ae819SStefano Zampini #define __FUNCT__ "PCBDDCScalingSetUp" 212674ae819SStefano Zampini PetscErrorCode PCBDDCScalingSetUp(PC pc) 213674ae819SStefano Zampini { 214674ae819SStefano Zampini PC_IS* pcis=(PC_IS*)pc->data; 215674ae819SStefano Zampini PC_BDDC* pcbddc=(PC_BDDC*)pc->data; 216674ae819SStefano Zampini PetscErrorCode ierr; 217674ae819SStefano Zampini 218674ae819SStefano Zampini PetscFunctionBegin; 219674ae819SStefano Zampini PetscValidHeaderSpecific(pc,PC_CLASSID,1); 220674ae819SStefano Zampini /* create work vector for the operator */ 22134a97f8cSStefano Zampini ierr = VecDestroy(&pcbddc->work_scaling);CHKERRQ(ierr); 222674ae819SStefano Zampini ierr = VecDuplicate(pcis->vec1_B,&pcbddc->work_scaling);CHKERRQ(ierr); 22334a97f8cSStefano Zampini /* always rebuild pcis->D */ 22428d874f6SStefano Zampini if (pcis->use_stiffness_scaling) { 225674ae819SStefano Zampini ierr = MatGetDiagonal(pcbddc->local_mat,pcis->vec1_N);CHKERRQ(ierr); 226674ae819SStefano Zampini ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 227674ae819SStefano Zampini ierr = VecScatterEnd(pcis->N_to_B,pcis->vec1_N,pcis->D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 228674ae819SStefano Zampini } 229674ae819SStefano Zampini ierr = VecCopy(pcis->D,pcis->vec1_B);CHKERRQ(ierr); 230674ae819SStefano Zampini ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr); 231674ae819SStefano Zampini ierr = VecScatterBegin(pcis->global_to_B,pcis->vec1_B,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 232674ae819SStefano Zampini ierr = VecScatterEnd(pcis->global_to_B,pcis->vec1_B,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 233674ae819SStefano Zampini ierr = VecScatterBegin(pcis->global_to_B,pcis->vec1_global,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 234674ae819SStefano Zampini ierr = VecScatterEnd(pcis->global_to_B,pcis->vec1_global,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 235674ae819SStefano Zampini ierr = VecPointwiseDivide(pcis->D,pcis->D,pcis->vec1_B);CHKERRQ(ierr); 236674ae819SStefano Zampini /* now setup */ 237681e7c04SStefano Zampini if (pcbddc->use_deluxe_scaling) { 23834a97f8cSStefano Zampini if (!pcbddc->deluxe_ctx) { 23934a97f8cSStefano Zampini ierr = PCBDDCScalingCreate_Deluxe(pc);CHKERRQ(ierr); 24034a97f8cSStefano Zampini } 24134a97f8cSStefano Zampini ierr = PCBDDCScalingSetUp_Deluxe(pc);CHKERRQ(ierr); 242674ae819SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)pc,"PCBDDCScalingRestriction_C",PCBDDCScalingRestriction_Deluxe);CHKERRQ(ierr); 243674ae819SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)pc,"PCBDDCScalingExtension_C",PCBDDCScalingExtension_Deluxe);CHKERRQ(ierr); 244674ae819SStefano Zampini } else { 245674ae819SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)pc,"PCBDDCScalingRestriction_C",PCBDDCScalingRestriction_Basic);CHKERRQ(ierr); 246674ae819SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)pc,"PCBDDCScalingExtension_C",PCBDDCScalingExtension_Basic);CHKERRQ(ierr); 247674ae819SStefano Zampini } 24834a97f8cSStefano Zampini 249674ae819SStefano Zampini /* test */ 250674ae819SStefano Zampini if (pcbddc->dbg_flag) { 25134a97f8cSStefano Zampini Vec vec2_global; 252674ae819SStefano Zampini PetscViewer viewer=pcbddc->dbg_viewer; 25334a97f8cSStefano Zampini PetscReal error; 254674ae819SStefano Zampini 255674ae819SStefano Zampini /* extension -> from local to parallel */ 25634a97f8cSStefano Zampini ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr); 25734a97f8cSStefano Zampini ierr = VecSetRandom(pcis->vec1_B,NULL);CHKERRQ(ierr); 25834a97f8cSStefano Zampini ierr = VecScatterBegin(pcis->global_to_B,pcis->vec1_B,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 25934a97f8cSStefano Zampini ierr = VecScatterEnd(pcis->global_to_B,pcis->vec1_B,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 26034a97f8cSStefano Zampini ierr = VecDuplicate(pcis->vec1_global,&vec2_global);CHKERRQ(ierr); 26134a97f8cSStefano Zampini ierr = VecCopy(pcis->vec1_global,vec2_global);CHKERRQ(ierr); 26234a97f8cSStefano Zampini 263674ae819SStefano Zampini ierr = VecScatterBegin(pcis->global_to_B,pcis->vec1_global,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 264674ae819SStefano Zampini ierr = VecScatterEnd(pcis->global_to_B,pcis->vec1_global,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 265674ae819SStefano Zampini ierr = PCBDDCScalingExtension(pc,pcis->vec1_B,pcis->vec1_global);CHKERRQ(ierr); 26634a97f8cSStefano Zampini ierr = VecAXPY(pcis->vec1_global,-1.0,vec2_global);CHKERRQ(ierr); 26734a97f8cSStefano Zampini ierr = VecNorm(pcis->vec1_global,NORM_INFINITY,&error);CHKERRQ(ierr); 268674ae819SStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"Error scaling extension %1.14e\n",error);CHKERRQ(ierr); 26934a97f8cSStefano Zampini if (error>1.e-8 && pcbddc->dbg_flag>1) { 270674ae819SStefano Zampini ierr = VecView(pcis->vec1_global,viewer);CHKERRQ(ierr); 271674ae819SStefano Zampini } 27234a97f8cSStefano Zampini ierr = VecDestroy(&vec2_global);CHKERRQ(ierr); 27334a97f8cSStefano Zampini 274674ae819SStefano Zampini /* restriction -> from parallel to local */ 275674ae819SStefano Zampini ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr); 27634a97f8cSStefano Zampini ierr = VecSetRandom(pcis->vec1_B,NULL);CHKERRQ(ierr); 277674ae819SStefano Zampini ierr = VecScatterBegin(pcis->global_to_B,pcis->vec1_B,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 278674ae819SStefano Zampini ierr = VecScatterEnd(pcis->global_to_B,pcis->vec1_B,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 27934a97f8cSStefano Zampini 28034a97f8cSStefano Zampini ierr = PCBDDCScalingRestriction(pc,pcis->vec1_global,pcis->vec1_B);CHKERRQ(ierr); 28134a97f8cSStefano Zampini ierr = VecScale(pcis->vec1_B,-1.0);CHKERRQ(ierr); 28234a97f8cSStefano Zampini ierr = VecScatterBegin(pcis->global_to_B,pcis->vec1_B,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 28334a97f8cSStefano Zampini ierr = VecScatterEnd(pcis->global_to_B,pcis->vec1_B,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 28434a97f8cSStefano Zampini ierr = VecNorm(pcis->vec1_global,NORM_INFINITY,&error);CHKERRQ(ierr); 28534a97f8cSStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"Error scaling restriction %1.14e\n",error);CHKERRQ(ierr); 28634a97f8cSStefano Zampini if (error>1.e-8 && pcbddc->dbg_flag>1) { 287674ae819SStefano Zampini ierr = VecView(pcis->vec1_global,viewer);CHKERRQ(ierr); 288674ae819SStefano Zampini } 289674ae819SStefano Zampini } 290674ae819SStefano Zampini PetscFunctionReturn(0); 291674ae819SStefano Zampini } 292674ae819SStefano Zampini 293674ae819SStefano Zampini #undef __FUNCT__ 294674ae819SStefano Zampini #define __FUNCT__ "PCBDDCScalingDestroy" 295674ae819SStefano Zampini PetscErrorCode PCBDDCScalingDestroy(PC pc) 296674ae819SStefano Zampini { 297674ae819SStefano Zampini PC_BDDC* pcbddc=(PC_BDDC*)pc->data; 298674ae819SStefano Zampini PetscErrorCode ierr; 299674ae819SStefano Zampini 300674ae819SStefano Zampini PetscFunctionBegin; 30134a97f8cSStefano Zampini if (pcbddc->deluxe_ctx) { 30234a97f8cSStefano Zampini ierr = PCBDDCScalingDestroy_Deluxe(pc);CHKERRQ(ierr); 303674ae819SStefano Zampini } 304674ae819SStefano Zampini ierr = VecDestroy(&pcbddc->work_scaling);CHKERRQ(ierr); 305674ae819SStefano Zampini /* remove functions */ 306674ae819SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)pc,"PCBDDCScalingRestriction_C",NULL);CHKERRQ(ierr); 307674ae819SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)pc,"PCBDDCScalingExtension_C",NULL);CHKERRQ(ierr); 308674ae819SStefano Zampini PetscFunctionReturn(0); 309674ae819SStefano Zampini } 310674ae819SStefano Zampini 31134a97f8cSStefano Zampini #undef __FUNCT__ 31234a97f8cSStefano Zampini #define __FUNCT__ "PCBDDCScalingCreate_Deluxe" 31334a97f8cSStefano Zampini static PetscErrorCode PCBDDCScalingCreate_Deluxe(PC pc) 31434a97f8cSStefano Zampini { 31534a97f8cSStefano Zampini PC_BDDC* pcbddc=(PC_BDDC*)pc->data; 31634a97f8cSStefano Zampini PCBDDCDeluxeScaling deluxe_ctx; 31734a97f8cSStefano Zampini PetscErrorCode ierr; 31834a97f8cSStefano Zampini 31934a97f8cSStefano Zampini PetscFunctionBegin; 32034a97f8cSStefano Zampini ierr = PetscNew(&deluxe_ctx);CHKERRQ(ierr); 32134a97f8cSStefano Zampini pcbddc->deluxe_ctx = deluxe_ctx; 32234a97f8cSStefano Zampini PetscFunctionReturn(0); 32334a97f8cSStefano Zampini } 32434a97f8cSStefano Zampini 32534a97f8cSStefano Zampini #undef __FUNCT__ 32634a97f8cSStefano Zampini #define __FUNCT__ "PCBDDCScalingDestroy_Deluxe" 32734a97f8cSStefano Zampini static PetscErrorCode PCBDDCScalingDestroy_Deluxe(PC pc) 32834a97f8cSStefano Zampini { 32934a97f8cSStefano Zampini PC_BDDC* pcbddc=(PC_BDDC*)pc->data; 33034a97f8cSStefano Zampini PetscErrorCode ierr; 33134a97f8cSStefano Zampini 33234a97f8cSStefano Zampini PetscFunctionBegin; 33334a97f8cSStefano Zampini ierr = PCBDDCScalingReset_Deluxe_Solvers(pcbddc->deluxe_ctx);CHKERRQ(ierr); 33434a97f8cSStefano Zampini ierr = PetscFree(pcbddc->deluxe_ctx);CHKERRQ(ierr); 33534a97f8cSStefano Zampini PetscFunctionReturn(0); 33634a97f8cSStefano Zampini } 33734a97f8cSStefano Zampini 33834a97f8cSStefano Zampini #undef __FUNCT__ 33934a97f8cSStefano Zampini #define __FUNCT__ "PCBDDCScalingReset_Deluxe_Solvers" 34034a97f8cSStefano Zampini static PetscErrorCode PCBDDCScalingReset_Deluxe_Solvers(PCBDDCDeluxeScaling deluxe_ctx) 34134a97f8cSStefano Zampini { 34234a97f8cSStefano Zampini PetscErrorCode ierr; 34334a97f8cSStefano Zampini 34434a97f8cSStefano Zampini PetscFunctionBegin; 34534a97f8cSStefano Zampini ierr = PetscFree(deluxe_ctx->idx_simple_B);CHKERRQ(ierr); 34634a97f8cSStefano Zampini deluxe_ctx->n_simple = 0; 34741c3ba1bSStefano Zampini if (deluxe_ctx->seq_ksp) { 34834a97f8cSStefano Zampini ierr = VecScatterDestroy(&deluxe_ctx->seq_scctx);CHKERRQ(ierr); 34934a97f8cSStefano Zampini ierr = VecDestroy(&deluxe_ctx->seq_work1);CHKERRQ(ierr); 35034a97f8cSStefano Zampini ierr = VecDestroy(&deluxe_ctx->seq_work2);CHKERRQ(ierr); 35134a97f8cSStefano Zampini ierr = KSPDestroy(&deluxe_ctx->seq_ksp);CHKERRQ(ierr); 35234a97f8cSStefano Zampini } 35334a97f8cSStefano Zampini if (deluxe_ctx->par_colors) { 35434a97f8cSStefano Zampini PetscInt i; 35534a97f8cSStefano Zampini for (i=0;i<deluxe_ctx->par_colors;i++) { 35634a97f8cSStefano Zampini ierr = VecScatterDestroy(&deluxe_ctx->par_scctx_s[i]);CHKERRQ(ierr); 35734a97f8cSStefano Zampini ierr = VecScatterDestroy(&deluxe_ctx->par_scctx_p[i]);CHKERRQ(ierr); 35834a97f8cSStefano Zampini ierr = VecDestroy(&deluxe_ctx->par_vec[i]);CHKERRQ(ierr); 359b96c3477SStefano Zampini ierr = VecDestroy(&deluxe_ctx->par_work1[i]);CHKERRQ(ierr); 360b96c3477SStefano Zampini ierr = VecDestroy(&deluxe_ctx->par_work2[i]);CHKERRQ(ierr); 36134a97f8cSStefano Zampini ierr = KSPDestroy(&deluxe_ctx->par_ksp[i]);CHKERRQ(ierr); 36234a97f8cSStefano Zampini } 363b96c3477SStefano Zampini ierr = PetscFree7(deluxe_ctx->par_ksp, 36434a97f8cSStefano Zampini deluxe_ctx->par_scctx_s, 36534a97f8cSStefano Zampini deluxe_ctx->par_scctx_p, 36634a97f8cSStefano Zampini deluxe_ctx->par_vec, 367b96c3477SStefano Zampini deluxe_ctx->par_work1, 368b96c3477SStefano Zampini deluxe_ctx->par_work2, 36934a97f8cSStefano Zampini deluxe_ctx->par_col2sub);CHKERRQ(ierr); 37034a97f8cSStefano Zampini } 37134a97f8cSStefano Zampini deluxe_ctx->par_colors = 0; 37234a97f8cSStefano Zampini PetscFunctionReturn(0); 37334a97f8cSStefano Zampini } 37434a97f8cSStefano Zampini 37534a97f8cSStefano Zampini #undef __FUNCT__ 37634a97f8cSStefano Zampini #define __FUNCT__ "PCBDDCScalingSetUp_Deluxe" 37734a97f8cSStefano Zampini static PetscErrorCode PCBDDCScalingSetUp_Deluxe(PC pc) 37834a97f8cSStefano Zampini { 37934a97f8cSStefano Zampini PC_IS *pcis=(PC_IS*)pc->data; 38034a97f8cSStefano Zampini PC_BDDC *pcbddc=(PC_BDDC*)pc->data; 38134a97f8cSStefano Zampini PCBDDCDeluxeScaling deluxe_ctx=pcbddc->deluxe_ctx; 382b96c3477SStefano Zampini PCBDDCSubSchurs sub_schurs=pcbddc->sub_schurs; 383*1b968477SStefano Zampini IS dirIS; 38434a97f8cSStefano Zampini PetscErrorCode ierr; 38534a97f8cSStefano Zampini 38634a97f8cSStefano Zampini PetscFunctionBegin; 387b96c3477SStefano Zampini /* (TODO: reuse) throw away the solvers */ 38834a97f8cSStefano Zampini ierr = PCBDDCScalingReset_Deluxe_Solvers(deluxe_ctx);CHKERRQ(ierr); 38934a97f8cSStefano Zampini 390b1b3d7a2SStefano Zampini /* Compute data structures to solve parallel problems */ 391b1b3d7a2SStefano Zampini ierr = PCBDDCScalingSetUp_Deluxe_Par(pc,sub_schurs->n_subs_par,sub_schurs->n_subs_par_g, 392b1b3d7a2SStefano Zampini sub_schurs->auxglobal_parallel, 393b1b3d7a2SStefano Zampini sub_schurs->index_parallel);CHKERRQ(ierr); 394b96c3477SStefano Zampini 395b1b3d7a2SStefano Zampini /* Compute data structures to solve sequential problems */ 396883469d8SStefano Zampini ierr = PCBDDCScalingSetUp_Deluxe_Seq(pc);CHKERRQ(ierr); 3975db18549SStefano Zampini 398b1b3d7a2SStefano Zampini /* diagonal scaling on interface dofs not contained in cc */ 399*1b968477SStefano Zampini dirIS = NULL; 400*1b968477SStefano Zampini if (pcbddc->DirichletBoundariesLocal) { 401*1b968477SStefano Zampini ierr = PCBDDCGraphGetDirichletDofs(pcbddc->mat_graph,&dirIS);CHKERRQ(ierr); 402*1b968477SStefano Zampini } 403*1b968477SStefano Zampini if (sub_schurs->is_Ej_com || dirIS) { 404*1b968477SStefano Zampini PetscInt n_com,n_dir; 405*1b968477SStefano Zampini n_com = 0; 406*1b968477SStefano Zampini if (sub_schurs->is_Ej_com) { 407*1b968477SStefano Zampini ierr = ISGetLocalSize(sub_schurs->is_Ej_com,&n_com);CHKERRQ(ierr); 408*1b968477SStefano Zampini } 409*1b968477SStefano Zampini n_dir = 0; 410*1b968477SStefano Zampini if (dirIS) { 411*1b968477SStefano Zampini ierr = ISGetLocalSize(dirIS,&n_dir);CHKERRQ(ierr); 412*1b968477SStefano Zampini } 413*1b968477SStefano Zampini deluxe_ctx->n_simple = n_dir + n_com; 414*1b968477SStefano Zampini ierr = PetscMalloc1(deluxe_ctx->n_simple,&deluxe_ctx->idx_simple_B);CHKERRQ(ierr); 4159bb4a8caSStefano Zampini if (sub_schurs->is_Ej_com) { 4169bb4a8caSStefano Zampini PetscInt nmap; 4179bb4a8caSStefano Zampini const PetscInt *idxs; 418*1b968477SStefano Zampini 4199bb4a8caSStefano Zampini ierr = ISGetIndices(sub_schurs->is_Ej_com,&idxs);CHKERRQ(ierr); 420*1b968477SStefano Zampini ierr = ISGlobalToLocalMappingApply(pcis->BtoNmap,IS_GTOLM_DROP,n_com,idxs,&nmap,deluxe_ctx->idx_simple_B);CHKERRQ(ierr); 421*1b968477SStefano Zampini if (nmap != n_com) { 422*1b968477SStefano Zampini SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Error when mapping simply scaled dofs (is_Ej_com)! %d != %d",nmap,n_com); 4239bb4a8caSStefano Zampini } 4249bb4a8caSStefano Zampini ierr = ISRestoreIndices(sub_schurs->is_Ej_com,&idxs);CHKERRQ(ierr); 425*1b968477SStefano Zampini } 426*1b968477SStefano Zampini if (dirIS) { 427*1b968477SStefano Zampini PetscInt nmap; 428*1b968477SStefano Zampini const PetscInt *idxs; 429*1b968477SStefano Zampini 430*1b968477SStefano Zampini ierr = ISGetIndices(dirIS,&idxs);CHKERRQ(ierr); 431*1b968477SStefano Zampini ierr = ISGlobalToLocalMappingApply(pcis->BtoNmap,IS_GTOLM_DROP,n_dir,idxs,&nmap,deluxe_ctx->idx_simple_B+n_com);CHKERRQ(ierr); 432*1b968477SStefano Zampini ierr = ISRestoreIndices(dirIS,&idxs);CHKERRQ(ierr); 433*1b968477SStefano Zampini } 434*1b968477SStefano Zampini ierr = PetscSortInt(deluxe_ctx->n_simple,deluxe_ctx->idx_simple_B);CHKERRQ(ierr); 4359bb4a8caSStefano Zampini } else { 436b1b3d7a2SStefano Zampini deluxe_ctx->n_simple = 0; 4379bb4a8caSStefano Zampini deluxe_ctx->idx_simple_B = 0; 438b1b3d7a2SStefano Zampini } 439*1b968477SStefano Zampini ierr = ISDestroy(&dirIS);CHKERRQ(ierr); 440*1b968477SStefano Zampini 44134a97f8cSStefano Zampini PetscFunctionReturn(0); 44234a97f8cSStefano Zampini } 44334a97f8cSStefano Zampini 44434a97f8cSStefano Zampini #undef __FUNCT__ 44534a97f8cSStefano Zampini #define __FUNCT__ "PCBDDCScalingSetUp_Deluxe_Par" 44634a97f8cSStefano Zampini static PetscErrorCode PCBDDCScalingSetUp_Deluxe_Par(PC pc, PetscInt n_local_parallel_problems,PetscInt n_parallel_problems,PetscInt global_parallel[],PetscInt index_parallel[]) 44734a97f8cSStefano Zampini { 44834a97f8cSStefano Zampini PC_BDDC *pcbddc=(PC_BDDC*)pc->data; 44934a97f8cSStefano Zampini PCBDDCDeluxeScaling deluxe_ctx=pcbddc->deluxe_ctx; 45034a97f8cSStefano Zampini /* coloring */ 45134a97f8cSStefano Zampini Mat parallel_problems; 45234a97f8cSStefano Zampini MatColoring coloring_obj; 45334a97f8cSStefano Zampini ISColoring coloring_parallel_problems; 45434a97f8cSStefano Zampini IS *par_is_colors,*is_colors; 45534a97f8cSStefano Zampini /* working stuff */ 45634a97f8cSStefano Zampini PetscInt i,j; 45734a97f8cSStefano Zampini PetscErrorCode ierr; 45834a97f8cSStefano Zampini 45934a97f8cSStefano Zampini PetscFunctionBegin; 46034a97f8cSStefano Zampini if (!n_parallel_problems) { 46134a97f8cSStefano Zampini PetscFunctionReturn(0); 46234a97f8cSStefano Zampini } 46334a97f8cSStefano Zampini /* Color parallel subproblems */ 46434a97f8cSStefano Zampini ierr = MatCreate(PetscObjectComm((PetscObject)pc),¶llel_problems);CHKERRQ(ierr); 46534a97f8cSStefano Zampini ierr = MatSetSizes(parallel_problems,PETSC_DECIDE,PETSC_DECIDE,n_parallel_problems,n_parallel_problems);CHKERRQ(ierr); 46634a97f8cSStefano Zampini ierr = MatSetType(parallel_problems,MATAIJ);CHKERRQ(ierr); 46734a97f8cSStefano Zampini ierr = MatSetUp(parallel_problems);CHKERRQ(ierr); 46834a97f8cSStefano Zampini ierr = MatSetOption(parallel_problems,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_FALSE);CHKERRQ(ierr); 46934a97f8cSStefano Zampini ierr = MatSetOption(parallel_problems,MAT_NEW_NONZERO_ALLOCATION_ERR,PETSC_FALSE);CHKERRQ(ierr); 47034a97f8cSStefano Zampini for (i=0;i<n_local_parallel_problems;i++) { 47134a97f8cSStefano Zampini PetscInt row = global_parallel[i]; 47234a97f8cSStefano Zampini for (j=0;j<n_local_parallel_problems;j++) { 47334a97f8cSStefano Zampini PetscInt col = global_parallel[j]; 47434a97f8cSStefano Zampini if (row != col) { 47534a97f8cSStefano Zampini ierr = MatSetValue(parallel_problems,row,col,1.0,INSERT_VALUES);CHKERRQ(ierr); 47634a97f8cSStefano Zampini } 47734a97f8cSStefano Zampini } 47834a97f8cSStefano Zampini } 47934a97f8cSStefano Zampini ierr = MatAssemblyBegin(parallel_problems,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 48034a97f8cSStefano Zampini ierr = MatAssemblyEnd(parallel_problems,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 48134a97f8cSStefano Zampini if (pcbddc->dbg_flag > 1) { 48234a97f8cSStefano Zampini ierr = PetscViewerFlush(pcbddc->dbg_viewer);CHKERRQ(ierr); 48334a97f8cSStefano Zampini ierr = PetscViewerASCIIPrintf(pcbddc->dbg_viewer,"Adj matrix for deluxe parallel problems\n");CHKERRQ(ierr); 48434a97f8cSStefano Zampini ierr = MatView(parallel_problems,pcbddc->dbg_viewer);CHKERRQ(ierr); 48534a97f8cSStefano Zampini } 48634a97f8cSStefano Zampini ierr = MatColoringCreate(parallel_problems,&coloring_obj);CHKERRQ(ierr); 48734a97f8cSStefano Zampini ierr = MatColoringSetDistance(coloring_obj,1);CHKERRQ(ierr); 48834a97f8cSStefano Zampini ierr = MatColoringSetType(coloring_obj,MATCOLORINGJP);CHKERRQ(ierr); 48934a97f8cSStefano Zampini ierr = MatColoringApply(coloring_obj,&coloring_parallel_problems);CHKERRQ(ierr); 49034a97f8cSStefano Zampini ierr = ISColoringGetIS(coloring_parallel_problems,&deluxe_ctx->par_colors,&par_is_colors);CHKERRQ(ierr); 49134a97f8cSStefano Zampini if (pcbddc->dbg_flag) { 49234a97f8cSStefano Zampini ierr = PetscViewerFlush(pcbddc->dbg_viewer);CHKERRQ(ierr); 49334a97f8cSStefano Zampini ierr = PetscViewerASCIIPrintf(pcbddc->dbg_viewer,"Number of colors %d for parallel part of deluxe\n",deluxe_ctx->par_colors);CHKERRQ(ierr); 49434a97f8cSStefano Zampini } 49534a97f8cSStefano Zampini 49634a97f8cSStefano Zampini /* all procs should know the color distribution */ 49734a97f8cSStefano Zampini ierr = PetscMalloc1(deluxe_ctx->par_colors,&is_colors);CHKERRQ(ierr); 49834a97f8cSStefano Zampini for (i=0;i<deluxe_ctx->par_colors;i++) { 49934a97f8cSStefano Zampini if (pcbddc->dbg_flag) { 50034a97f8cSStefano Zampini ierr = PetscViewerASCIIPrintf(pcbddc->dbg_viewer,"Global problem indexes for color %d\n",i);CHKERRQ(ierr); 50134a97f8cSStefano Zampini ierr = ISView(par_is_colors[i],pcbddc->dbg_viewer);CHKERRQ(ierr); 50234a97f8cSStefano Zampini ierr = PetscViewerFlush(pcbddc->dbg_viewer);CHKERRQ(ierr); 50334a97f8cSStefano Zampini } 50434a97f8cSStefano Zampini ierr = ISAllGather(par_is_colors[i],&is_colors[i]);CHKERRQ(ierr); 50534a97f8cSStefano Zampini } 50634a97f8cSStefano Zampini 50734a97f8cSStefano Zampini /* free unneeded objects */ 50834a97f8cSStefano Zampini ierr = ISColoringRestoreIS(coloring_parallel_problems,&par_is_colors);CHKERRQ(ierr); 50934a97f8cSStefano Zampini ierr = ISColoringDestroy(&coloring_parallel_problems);CHKERRQ(ierr); 51034a97f8cSStefano Zampini ierr = MatColoringDestroy(&coloring_obj);CHKERRQ(ierr); 51134a97f8cSStefano Zampini ierr = MatDestroy(¶llel_problems);CHKERRQ(ierr); 51234a97f8cSStefano Zampini 51334a97f8cSStefano Zampini /* allocate deluxe arrays for parallel problems */ 514b96c3477SStefano Zampini ierr = PetscCalloc7(deluxe_ctx->par_colors,&deluxe_ctx->par_ksp, 51534a97f8cSStefano Zampini deluxe_ctx->par_colors,&deluxe_ctx->par_scctx_s, 51634a97f8cSStefano Zampini deluxe_ctx->par_colors,&deluxe_ctx->par_scctx_p, 51734a97f8cSStefano Zampini deluxe_ctx->par_colors,&deluxe_ctx->par_vec, 518b96c3477SStefano Zampini deluxe_ctx->par_colors,&deluxe_ctx->par_work1, 519b96c3477SStefano Zampini deluxe_ctx->par_colors,&deluxe_ctx->par_work2, 52034a97f8cSStefano Zampini deluxe_ctx->par_colors,&deluxe_ctx->par_col2sub);CHKERRQ(ierr); 52134a97f8cSStefano Zampini 52234a97f8cSStefano Zampini /* cycle on colors */ 52334a97f8cSStefano Zampini for (i=0;i<deluxe_ctx->par_colors;i++) { 52434a97f8cSStefano Zampini PetscSubcomm par_subcomm; 52534a97f8cSStefano Zampini const PetscInt* idxs_subproblems; 52634a97f8cSStefano Zampini PetscInt color_size; 52734a97f8cSStefano Zampini PetscMPIInt rank,active_color; 52834a97f8cSStefano Zampini 52934a97f8cSStefano Zampini /* get local index of i-th parallel colored problem */ 53034a97f8cSStefano Zampini ierr = ISGetLocalSize(is_colors[i],&color_size);CHKERRQ(ierr); 53134a97f8cSStefano Zampini ierr = ISGetIndices(is_colors[i],&idxs_subproblems);CHKERRQ(ierr); 53234a97f8cSStefano Zampini /* split comm for computing parallel problems for this color */ 53334a97f8cSStefano Zampini /* Processes not partecipating at this stage will have color = color_size */ 53434a97f8cSStefano Zampini /* because PetscCommDuplicate does not handle MPI_COMM_NULL */ 53534a97f8cSStefano Zampini active_color = color_size; 53634a97f8cSStefano Zampini deluxe_ctx->par_col2sub[i] = -1; 53734a97f8cSStefano Zampini for (j=0;j<n_local_parallel_problems;j++) { 53834a97f8cSStefano Zampini PetscInt local_idx; 53934a97f8cSStefano Zampini ierr = PetscFindInt(global_parallel[j],color_size,idxs_subproblems,&local_idx);CHKERRQ(ierr); 54034a97f8cSStefano Zampini if (local_idx > -1) { 54134a97f8cSStefano Zampini ierr = PetscMPIIntCast(local_idx,&active_color);CHKERRQ(ierr); 54234a97f8cSStefano Zampini deluxe_ctx->par_col2sub[i] = index_parallel[j]; 54334a97f8cSStefano Zampini break; 54434a97f8cSStefano Zampini } 54534a97f8cSStefano Zampini } 54634a97f8cSStefano Zampini ierr = ISRestoreIndices(is_colors[i],&idxs_subproblems);CHKERRQ(ierr); 54734a97f8cSStefano Zampini ierr = PetscSubcommCreate(PetscObjectComm((PetscObject)pc),&par_subcomm);CHKERRQ(ierr); 54834a97f8cSStefano Zampini ierr = PetscSubcommSetNumber(par_subcomm,color_size+1);CHKERRQ(ierr); 54934a97f8cSStefano Zampini ierr = MPI_Comm_rank(PetscObjectComm((PetscObject)pc),&rank);CHKERRQ(ierr); 55034a97f8cSStefano Zampini ierr = PetscSubcommSetTypeGeneral(par_subcomm,active_color,rank);CHKERRQ(ierr); 55134a97f8cSStefano Zampini /* print debug info */ 55234a97f8cSStefano Zampini if (pcbddc->dbg_flag) { 55334a97f8cSStefano Zampini PetscMPIInt crank,csize; 55434a97f8cSStefano Zampini ierr = MPI_Comm_rank(par_subcomm->comm,&crank);CHKERRQ(ierr); 55534a97f8cSStefano Zampini ierr = MPI_Comm_size(par_subcomm->comm,&csize);CHKERRQ(ierr); 55634a97f8cSStefano Zampini ierr = PetscViewerASCIIPrintf(pcbddc->dbg_viewer,"Color %d: size %d, details follows.\n",i,color_size);CHKERRQ(ierr); 55734a97f8cSStefano Zampini ierr = PetscViewerFlush(pcbddc->dbg_viewer);CHKERRQ(ierr); 55834a97f8cSStefano Zampini ierr = PetscViewerASCIISynchronizedAllow(pcbddc->dbg_viewer,PETSC_TRUE);CHKERRQ(ierr); 55934a97f8cSStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer," Subdomain %d: color in subcomm %d (rank %d out of %d) (lidx %d)\n",PetscGlobalRank,par_subcomm->color,crank,csize,deluxe_ctx->par_col2sub[i]);CHKERRQ(ierr); 56034a97f8cSStefano Zampini ierr = PetscViewerFlush(pcbddc->dbg_viewer);CHKERRQ(ierr); 56134a97f8cSStefano Zampini } 56234a97f8cSStefano Zampini 56334a97f8cSStefano Zampini if (deluxe_ctx->par_col2sub[i] >= 0) { 5645e8657edSStefano Zampini PC pctemp; 5655e8657edSStefano Zampini PC_IS *pcis=(PC_IS*)pc->data; 56634a97f8cSStefano Zampini Mat color_mat,color_mat_is,temp_mat; 56734a97f8cSStefano Zampini ISLocalToGlobalMapping WtoNmap,l2gmap_subset; 56834a97f8cSStefano Zampini IS is_local_numbering,isB_local,isW_local,isW; 569b96c3477SStefano Zampini PCBDDCSubSchurs sub_schurs = pcbddc->sub_schurs; 57034a97f8cSStefano Zampini PetscInt subidx,n_local_dofs,n_global_dofs; 57134a97f8cSStefano Zampini PetscInt *global_numbering,*local_numbering; 57234a97f8cSStefano Zampini char ksp_prefix[256]; 57334a97f8cSStefano Zampini size_t len; 57434a97f8cSStefano Zampini 57534a97f8cSStefano Zampini /* Local index for schur complement on subset */ 57634a97f8cSStefano Zampini subidx = deluxe_ctx->par_col2sub[i]; 57734a97f8cSStefano Zampini 57834a97f8cSStefano Zampini /* Parallel numbering for dofs in colored subset */ 579b96c3477SStefano Zampini ierr = ISSum(sub_schurs->is_I_layer,sub_schurs->is_subs[subidx],&is_local_numbering);CHKERRQ(ierr); 58034a97f8cSStefano Zampini ierr = ISGetLocalSize(is_local_numbering,&n_local_dofs);CHKERRQ(ierr); 58134a97f8cSStefano Zampini ierr = ISGetIndices(is_local_numbering,(const PetscInt **)&local_numbering);CHKERRQ(ierr); 58234a97f8cSStefano Zampini ierr = PCBDDCSubsetNumbering(par_subcomm->comm,pcbddc->mat_graph->l2gmap,n_local_dofs,local_numbering,PETSC_NULL,&n_global_dofs,&global_numbering);CHKERRQ(ierr); 58334a97f8cSStefano Zampini ierr = ISRestoreIndices(is_local_numbering,(const PetscInt **)&local_numbering);CHKERRQ(ierr); 58434a97f8cSStefano Zampini 58534a97f8cSStefano Zampini /* L2Gmap from relevant dofs to local dofs */ 58634a97f8cSStefano Zampini ierr = ISLocalToGlobalMappingCreateIS(is_local_numbering,&WtoNmap);CHKERRQ(ierr); 58734a97f8cSStefano Zampini 58834a97f8cSStefano Zampini /* L2Gmap from local to global dofs */ 58934a97f8cSStefano Zampini ierr = ISLocalToGlobalMappingCreate(par_subcomm->comm,1,n_local_dofs,global_numbering,PETSC_COPY_VALUES,&l2gmap_subset);CHKERRQ(ierr); 59034a97f8cSStefano Zampini 59134a97f8cSStefano Zampini /* compute parallel matrix (extended dirichlet problem on subset) */ 59234a97f8cSStefano Zampini ierr = MatCreateIS(par_subcomm->comm,1,PETSC_DECIDE,PETSC_DECIDE,n_global_dofs,n_global_dofs,l2gmap_subset,&color_mat_is);CHKERRQ(ierr); 59334a97f8cSStefano Zampini ierr = MatGetSubMatrix(pcbddc->local_mat,is_local_numbering,is_local_numbering,MAT_INITIAL_MATRIX,&temp_mat);CHKERRQ(ierr); 59434a97f8cSStefano Zampini ierr = MatISSetLocalMat(color_mat_is,temp_mat);CHKERRQ(ierr); 59534a97f8cSStefano Zampini ierr = MatDestroy(&temp_mat);CHKERRQ(ierr); 59634a97f8cSStefano Zampini ierr = MatISGetMPIXAIJ(color_mat_is,MAT_INITIAL_MATRIX,&color_mat);CHKERRQ(ierr); 59734a97f8cSStefano Zampini ierr = MatDestroy(&color_mat_is);CHKERRQ(ierr); 59834a97f8cSStefano Zampini 59934a97f8cSStefano Zampini /* work vector for (parallel) extended dirichlet problem */ 6008a26ef87SStefano Zampini ierr = MatCreateVecs(color_mat,&deluxe_ctx->par_vec[i],NULL);CHKERRQ(ierr); 60134a97f8cSStefano Zampini 60234a97f8cSStefano Zampini /* compute scatters */ 60334a97f8cSStefano Zampini /* deluxe_ctx->par_scctx_p[i] extension from local subset to extended dirichlet problem 60434a97f8cSStefano Zampini deluxe_ctx->par_scctx_s[i] restriction from local boundary to subset -> simple copy of selected values */ 605b96c3477SStefano Zampini ierr = ISGlobalToLocalMappingApplyIS(pcis->BtoNmap,IS_GTOLM_DROP,sub_schurs->is_subs[subidx],&isB_local);CHKERRQ(ierr); 606b96c3477SStefano Zampini ierr = MatCreateVecs(sub_schurs->S_Ej[subidx],&deluxe_ctx->par_work1[i],&deluxe_ctx->par_work2[i]);CHKERRQ(ierr); 607b96c3477SStefano Zampini ierr = VecScatterCreate(pcbddc->work_scaling,isB_local,deluxe_ctx->par_work1[i],NULL,&deluxe_ctx->par_scctx_s[i]);CHKERRQ(ierr); 608b96c3477SStefano Zampini ierr = ISGlobalToLocalMappingApplyIS(WtoNmap,IS_GTOLM_DROP,sub_schurs->is_subs[subidx],&isW_local);CHKERRQ(ierr); 60934a97f8cSStefano Zampini ierr = ISLocalToGlobalMappingApplyIS(l2gmap_subset,isW_local,&isW);CHKERRQ(ierr); 610b96c3477SStefano Zampini ierr = VecScatterCreate(deluxe_ctx->par_work1[i],NULL,deluxe_ctx->par_vec[i],isW,&deluxe_ctx->par_scctx_p[i]);CHKERRQ(ierr); 61134a97f8cSStefano Zampini 61234a97f8cSStefano Zampini /* free objects no longer neeeded */ 61334a97f8cSStefano Zampini ierr = ISDestroy(&isW);CHKERRQ(ierr); 61434a97f8cSStefano Zampini ierr = ISDestroy(&isW_local);CHKERRQ(ierr); 61534a97f8cSStefano Zampini ierr = ISDestroy(&isB_local);CHKERRQ(ierr); 61634a97f8cSStefano Zampini ierr = ISLocalToGlobalMappingDestroy(&WtoNmap);CHKERRQ(ierr); 61734a97f8cSStefano Zampini ierr = ISLocalToGlobalMappingDestroy(&l2gmap_subset);CHKERRQ(ierr); 61834a97f8cSStefano Zampini ierr = ISDestroy(&is_local_numbering);CHKERRQ(ierr); 61934a97f8cSStefano Zampini ierr = PetscFree(global_numbering);CHKERRQ(ierr); 62034a97f8cSStefano Zampini 62134a97f8cSStefano Zampini /* KSP for extended dirichlet problem */ 62234a97f8cSStefano Zampini ierr = KSPCreate(par_subcomm->comm,&deluxe_ctx->par_ksp[i]);CHKERRQ(ierr); 62334a97f8cSStefano Zampini ierr = KSPSetOperators(deluxe_ctx->par_ksp[i],color_mat,color_mat);CHKERRQ(ierr); 62434a97f8cSStefano Zampini ierr = KSPSetTolerances(deluxe_ctx->par_ksp[i],1.e-12,1.e-12,1.e10,10000);CHKERRQ(ierr); 62534a97f8cSStefano Zampini ierr = KSPSetType(deluxe_ctx->par_ksp[i],KSPPREONLY);CHKERRQ(ierr); 6265e8657edSStefano Zampini ierr = KSPGetPC(deluxe_ctx->par_ksp[i],&pctemp);CHKERRQ(ierr); 6275e8657edSStefano Zampini ierr = PCSetType(pctemp,PCREDUNDANT);CHKERRQ(ierr); 62834a97f8cSStefano Zampini ierr = PetscStrlen(((PetscObject)(pcbddc->ksp_D))->prefix,&len);CHKERRQ(ierr); 6298856534dSStefano Zampini len -= 10; /* remove "dirichlet_" */ 6308856534dSStefano Zampini ierr = PetscStrncpy(ksp_prefix,((PetscObject)(pcbddc->ksp_D))->prefix,len+1);CHKERRQ(ierr); /* PetscStrncpy puts a terminating char at the end */ 63134a97f8cSStefano Zampini ierr = PetscStrcat(ksp_prefix,"deluxe_par_");CHKERRQ(ierr); 63234a97f8cSStefano Zampini ierr = KSPSetOptionsPrefix(deluxe_ctx->par_ksp[i],ksp_prefix);CHKERRQ(ierr); 63334a97f8cSStefano Zampini ierr = KSPSetFromOptions(deluxe_ctx->par_ksp[i]);CHKERRQ(ierr); 63434a97f8cSStefano Zampini ierr = KSPSetUp(deluxe_ctx->par_ksp[i]);CHKERRQ(ierr); 63534a97f8cSStefano Zampini ierr = MatDestroy(&color_mat);CHKERRQ(ierr); 63634a97f8cSStefano Zampini } 63734a97f8cSStefano Zampini ierr = PetscSubcommDestroy(&par_subcomm);CHKERRQ(ierr); 63834a97f8cSStefano Zampini } 63934a97f8cSStefano Zampini for (i=0;i<deluxe_ctx->par_colors;i++) { 64034a97f8cSStefano Zampini ierr = ISDestroy(&is_colors[i]);CHKERRQ(ierr); 64134a97f8cSStefano Zampini } 64234a97f8cSStefano Zampini ierr = PetscFree(is_colors);CHKERRQ(ierr); 64334a97f8cSStefano Zampini 64434a97f8cSStefano Zampini if (pcbddc->dbg_flag) { 64534a97f8cSStefano Zampini Vec test_vec; 64634a97f8cSStefano Zampini PetscReal error; 647b96c3477SStefano Zampini PCBDDCSubSchurs sub_schurs = pcbddc->sub_schurs; 64834a97f8cSStefano Zampini /* test partition of unity of coloured schur complements */ 64934a97f8cSStefano Zampini for (i=0;i<deluxe_ctx->par_colors;i++) { 65034a97f8cSStefano Zampini PetscInt subidx = deluxe_ctx->par_col2sub[i]; 65134a97f8cSStefano Zampini PetscBool error_found = PETSC_FALSE; 65234a97f8cSStefano Zampini ierr = PetscViewerASCIISynchronizedAllow(pcbddc->dbg_viewer,PETSC_TRUE);CHKERRQ(ierr); 65334a97f8cSStefano Zampini 65434a97f8cSStefano Zampini if (deluxe_ctx->par_ksp[i]) { 65534a97f8cSStefano Zampini /* create random test vec being zero on internal nodes of the extende dirichlet problem */ 65634a97f8cSStefano Zampini ierr = VecDuplicate(deluxe_ctx->par_vec[i],&test_vec);CHKERRQ(ierr); 657b96c3477SStefano Zampini ierr = VecSetRandom(deluxe_ctx->par_work1[i],PETSC_NULL);CHKERRQ(ierr); 65834a97f8cSStefano Zampini ierr = VecSet(test_vec,0.0);CHKERRQ(ierr); 659b96c3477SStefano Zampini ierr = VecScatterBegin(deluxe_ctx->par_scctx_p[i],deluxe_ctx->par_work1[i],test_vec,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 660b96c3477SStefano Zampini ierr = VecScatterEnd(deluxe_ctx->par_scctx_p[i],deluxe_ctx->par_work1[i],test_vec,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 66134a97f8cSStefano Zampini /* w_j */ 662b96c3477SStefano Zampini ierr = VecScatterBegin(deluxe_ctx->par_scctx_p[i],test_vec,deluxe_ctx->par_work1[i],INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 663b96c3477SStefano Zampini ierr = VecScatterEnd(deluxe_ctx->par_scctx_p[i],test_vec,deluxe_ctx->par_work1[i],INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 66434a97f8cSStefano Zampini /* S_j*w_j */ 665b96c3477SStefano Zampini ierr = MatMult(sub_schurs->S_Ej[subidx],deluxe_ctx->par_work1[i],deluxe_ctx->par_work2[i]);CHKERRQ(ierr); 66634a97f8cSStefano Zampini /* \sum_j S_j*w_j */ 66734a97f8cSStefano Zampini ierr = VecSet(deluxe_ctx->par_vec[i],0.0);CHKERRQ(ierr); 668b96c3477SStefano Zampini ierr = VecScatterBegin(deluxe_ctx->par_scctx_p[i],deluxe_ctx->par_work2[i],deluxe_ctx->par_vec[i],ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 669b96c3477SStefano Zampini ierr = VecScatterEnd(deluxe_ctx->par_scctx_p[i],deluxe_ctx->par_work2[i],deluxe_ctx->par_vec[i],ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 67034a97f8cSStefano Zampini /* (\sum_j S_j)^(-1)(\sum_j S_j*w_j) */ 67134a97f8cSStefano Zampini ierr = KSPSolve(deluxe_ctx->par_ksp[i],deluxe_ctx->par_vec[i],deluxe_ctx->par_vec[i]);CHKERRQ(ierr); 672b96c3477SStefano Zampini ierr = VecScatterBegin(deluxe_ctx->par_scctx_p[i],deluxe_ctx->par_vec[i],deluxe_ctx->par_work1[i],INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 673b96c3477SStefano Zampini ierr = VecScatterEnd(deluxe_ctx->par_scctx_p[i],deluxe_ctx->par_vec[i],deluxe_ctx->par_work1[i],INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 67434a97f8cSStefano Zampini ierr = VecSet(deluxe_ctx->par_vec[i],0.0);CHKERRQ(ierr); 675b96c3477SStefano Zampini ierr = VecScatterBegin(deluxe_ctx->par_scctx_p[i],deluxe_ctx->par_work1[i],deluxe_ctx->par_vec[i],INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 676b96c3477SStefano Zampini ierr = VecScatterEnd(deluxe_ctx->par_scctx_p[i],deluxe_ctx->par_work1[i],deluxe_ctx->par_vec[i],INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 67734a97f8cSStefano Zampini /* test partition of unity */ 67834a97f8cSStefano Zampini ierr = VecAXPY(test_vec,-1.0,deluxe_ctx->par_vec[i]);CHKERRQ(ierr); 67934a97f8cSStefano Zampini ierr = VecNorm(test_vec,NORM_INFINITY,&error);CHKERRQ(ierr); 680c63f45b2SStefano Zampini if (PetscAbsReal(error) > 1.e-2) { 68134a97f8cSStefano Zampini /* ierr = VecView(test_vec,0);CHKERRQ(ierr); */ 68234a97f8cSStefano Zampini error_found = PETSC_TRUE; 68334a97f8cSStefano Zampini } 68434a97f8cSStefano Zampini ierr = VecDestroy(&test_vec);CHKERRQ(ierr); 68534a97f8cSStefano Zampini } 68634a97f8cSStefano Zampini if (error_found) { 68734a97f8cSStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"Error testing local schur for color %d and subdomain %d\n",i,PetscGlobalRank);CHKERRQ(ierr); 68834a97f8cSStefano Zampini } 68934a97f8cSStefano Zampini ierr = PetscViewerFlush(pcbddc->dbg_viewer);CHKERRQ(ierr); 69034a97f8cSStefano Zampini } 69134a97f8cSStefano Zampini } 69234a97f8cSStefano Zampini PetscFunctionReturn(0); 69334a97f8cSStefano Zampini } 69434a97f8cSStefano Zampini 6955db18549SStefano Zampini #undef __FUNCT__ 696883469d8SStefano Zampini #define __FUNCT__ "PCBDDCScalingSetUp_Deluxe_Seq" 697883469d8SStefano Zampini static PetscErrorCode PCBDDCScalingSetUp_Deluxe_Seq(PC pc) 6985db18549SStefano Zampini { 6995db18549SStefano Zampini PC_BDDC *pcbddc=(PC_BDDC*)pc->data; 7005db18549SStefano Zampini PCBDDCDeluxeScaling deluxe_ctx=pcbddc->deluxe_ctx; 701b96c3477SStefano Zampini PCBDDCSubSchurs sub_schurs = pcbddc->sub_schurs; 7025db18549SStefano Zampini PC pc_temp; 7035db18549SStefano Zampini MatSolverPackage solver=NULL; 7045db18549SStefano Zampini char ksp_prefix[256]; 7055db18549SStefano Zampini size_t len; 7065db18549SStefano Zampini PetscInt local_size; 7075db18549SStefano Zampini PetscErrorCode ierr; 7085db18549SStefano Zampini 7095db18549SStefano Zampini PetscFunctionBegin; 7109221af80SStefano Zampini if (!sub_schurs->n_subs_seq_g) { 7119221af80SStefano Zampini PetscFunctionReturn(0); 7129221af80SStefano Zampini } 7139221af80SStefano Zampini 7145db18549SStefano Zampini /* Create work vectors for sequential part of deluxe */ 71565d8bf0aSStefano Zampini ierr = MatCreateVecs(sub_schurs->sum_S_Ej_all,&deluxe_ctx->seq_work1,&deluxe_ctx->seq_work2);CHKERRQ(ierr); 7165db18549SStefano Zampini 7175db18549SStefano Zampini /* Compute deluxe sequential scatter */ 7185db18549SStefano Zampini ierr = VecScatterCreate(pcbddc->work_scaling,sub_schurs->is_Ej_all,deluxe_ctx->seq_work1,NULL,&deluxe_ctx->seq_scctx);CHKERRQ(ierr); 7195db18549SStefano Zampini 7205db18549SStefano Zampini /* Create KSP object for sequential part of deluxe scaling */ 7215db18549SStefano Zampini ierr = KSPCreate(PETSC_COMM_SELF,&deluxe_ctx->seq_ksp);CHKERRQ(ierr); 7225db18549SStefano Zampini ierr = KSPSetOperators(deluxe_ctx->seq_ksp,sub_schurs->sum_S_Ej_all,sub_schurs->sum_S_Ej_all);CHKERRQ(ierr); 7235db18549SStefano Zampini ierr = KSPSetType(deluxe_ctx->seq_ksp,KSPPREONLY);CHKERRQ(ierr); 7245db18549SStefano Zampini ierr = KSPGetPC(deluxe_ctx->seq_ksp,&pc_temp);CHKERRQ(ierr); 7255db18549SStefano Zampini ierr = PCSetType(pc_temp,PCLU);CHKERRQ(ierr); 7265db18549SStefano Zampini ierr = KSPGetPC(pcbddc->ksp_D,&pc_temp);CHKERRQ(ierr); 7275db18549SStefano Zampini ierr = PCFactorGetMatSolverPackage(pc_temp,(const MatSolverPackage*)&solver);CHKERRQ(ierr); 7285db18549SStefano Zampini ierr = MatGetSize(sub_schurs->sum_S_Ej_all,&local_size,NULL);CHKERRQ(ierr); 7295db18549SStefano Zampini if (solver && local_size) { /* if local_size is null, some external packages will report errors */ 7305db18549SStefano Zampini PC new_pc; 7315db18549SStefano Zampini PCType type; 7325db18549SStefano Zampini ierr = PCGetType(pc_temp,&type);CHKERRQ(ierr); 7335db18549SStefano Zampini ierr = KSPGetPC(deluxe_ctx->seq_ksp,&new_pc);CHKERRQ(ierr); 7345db18549SStefano Zampini ierr = PCSetType(new_pc,type);CHKERRQ(ierr); 7355db18549SStefano Zampini ierr = PCFactorSetMatSolverPackage(new_pc,solver);CHKERRQ(ierr); 7365db18549SStefano Zampini } 7375db18549SStefano Zampini ierr = PetscStrlen(((PetscObject)(pcbddc->ksp_D))->prefix,&len);CHKERRQ(ierr); 7385db18549SStefano Zampini len -= 10; /* remove "dirichlet_" */ 7395db18549SStefano Zampini ierr = PetscStrncpy(ksp_prefix,((PetscObject)(pcbddc->ksp_D))->prefix,len+1);CHKERRQ(ierr); 7405db18549SStefano Zampini ierr = PetscStrcat(ksp_prefix,"deluxe_seq_");CHKERRQ(ierr); 7415db18549SStefano Zampini ierr = KSPSetOptionsPrefix(deluxe_ctx->seq_ksp,ksp_prefix);CHKERRQ(ierr); 7425db18549SStefano Zampini if (local_size) { 7435db18549SStefano Zampini ierr = KSPSetFromOptions(deluxe_ctx->seq_ksp);CHKERRQ(ierr); 7445db18549SStefano Zampini } 7455db18549SStefano Zampini ierr = KSPSetUp(deluxe_ctx->seq_ksp);CHKERRQ(ierr); 7465db18549SStefano Zampini PetscFunctionReturn(0); 7475db18549SStefano Zampini } 748