1dba47a55SKris Buschelman 24b9ad928SBarry Smith /* 33f457be1SHong Zhang This file defines a "solve the problem redundantly on each subgroup of processor" preconditioner. 44b9ad928SBarry Smith */ 5af0996ceSBarry Smith #include <petsc/private/pcimpl.h> 6c6db04a5SJed Brown #include <petscksp.h> /*I "petscksp.h" I*/ 74b9ad928SBarry Smith 84b9ad928SBarry Smith typedef struct { 93e065800SHong Zhang KSP ksp; 104b9ad928SBarry Smith PC pc; /* actual preconditioner used on each processor */ 11ce94432eSBarry Smith Vec xsub,ysub; /* vectors of a subcommunicator to hold parallel vectors of PetscObjectComm((PetscObject)pc) */ 123f457be1SHong Zhang Vec xdup,ydup; /* parallel vector that congregates xsub or ysub facilitating vector scattering */ 13b3804887SHong Zhang Mat pmats; /* matrix and optional preconditioner matrix belong to a subcommunicator */ 143f457be1SHong Zhang VecScatter scatterin,scatterout; /* scatter used to move all values to each processor group (subcommunicator) */ 15ace3abfcSBarry Smith PetscBool useparallelmat; 16c540e29cSHong Zhang PetscSubcomm psubcomm; 171fbd8f88SHong Zhang PetscInt nsubcomm; /* num of data structure PetscSubcomm */ 184b9ad928SBarry Smith } PC_Redundant; 194b9ad928SBarry Smith 204b9ad928SBarry Smith #undef __FUNCT__ 214b9ad928SBarry Smith #define __FUNCT__ "PCView_Redundant" 226849ba73SBarry Smith static PetscErrorCode PCView_Redundant(PC pc,PetscViewer viewer) 234b9ad928SBarry Smith { 244b9ad928SBarry Smith PC_Redundant *red = (PC_Redundant*)pc->data; 25dfbe8321SBarry Smith PetscErrorCode ierr; 26ace3abfcSBarry Smith PetscBool iascii,isstring; 2703ccd0b4SBarry Smith PetscViewer subviewer; 284b9ad928SBarry Smith 294b9ad928SBarry Smith PetscFunctionBegin; 30251f4c67SDmitry Karpeev ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERASCII,&iascii);CHKERRQ(ierr); 31251f4c67SDmitry Karpeev ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERSTRING,&isstring);CHKERRQ(ierr); 3232077d6dSBarry Smith if (iascii) { 3303ccd0b4SBarry Smith if (!red->psubcomm) { 3403ccd0b4SBarry Smith ierr = PetscViewerASCIIPrintf(viewer," Redundant preconditioner: Not yet setup\n");CHKERRQ(ierr); 3503ccd0b4SBarry Smith } else { 363e065800SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," Redundant preconditioner: First (color=0) of %D PCs follows\n",red->nsubcomm);CHKERRQ(ierr); 373f08860eSBarry Smith ierr = PetscViewerGetSubViewer(viewer,((PetscObject)red->pc)->comm,&subviewer);CHKERRQ(ierr); 38f5dd71faSBarry Smith if (!red->psubcomm->color) { /* only view first redundant pc */ 39*1575c14dSBarry Smith ierr = PetscViewerASCIIPushTab(subviewer);CHKERRQ(ierr); 403e065800SHong Zhang ierr = KSPView(red->ksp,subviewer);CHKERRQ(ierr); 41*1575c14dSBarry Smith ierr = PetscViewerASCIIPopTab(subviewer);CHKERRQ(ierr); 424b9ad928SBarry Smith } 433f08860eSBarry Smith ierr = PetscViewerRestoreSubViewer(viewer,((PetscObject)red->pc)->comm,&subviewer);CHKERRQ(ierr); 444b9ad928SBarry Smith } 4503ccd0b4SBarry Smith } else if (isstring) { 4603ccd0b4SBarry Smith ierr = PetscViewerStringSPrintf(viewer," Redundant solver preconditioner");CHKERRQ(ierr); 474b9ad928SBarry Smith } 484b9ad928SBarry Smith PetscFunctionReturn(0); 494b9ad928SBarry Smith } 504b9ad928SBarry Smith 514b9ad928SBarry Smith #undef __FUNCT__ 524b9ad928SBarry Smith #define __FUNCT__ "PCSetUp_Redundant" 536849ba73SBarry Smith static PetscErrorCode PCSetUp_Redundant(PC pc) 544b9ad928SBarry Smith { 554b9ad928SBarry Smith PC_Redundant *red = (PC_Redundant*)pc->data; 56dfbe8321SBarry Smith PetscErrorCode ierr; 571b81debcSHong Zhang PetscInt mstart,mend,mlocal,M; 5813f74950SBarry Smith PetscMPIInt size; 59ce94432eSBarry Smith MPI_Comm comm,subcomm; 60ddc54837SHong Zhang Vec x; 611fbd8f88SHong Zhang const char *prefix; 623f457be1SHong Zhang 634b9ad928SBarry Smith PetscFunctionBegin; 64ce94432eSBarry Smith ierr = PetscObjectGetComm((PetscObject)pc,&comm);CHKERRQ(ierr); 65ddc54837SHong Zhang 66ddc54837SHong Zhang /* if pmatrix set by user is sequential then we do not need to gather the parallel matrix */ 67ddc54837SHong Zhang ierr = MPI_Comm_size(comm,&size);CHKERRQ(ierr); 68ddc54837SHong Zhang if (size == 1) red->useparallelmat = PETSC_FALSE; 691fbd8f88SHong Zhang 704b9ad928SBarry Smith if (!pc->setupcalled) { 711b81debcSHong Zhang PetscInt mloc_sub; 725f06b7aaSBarry Smith if (!red->psubcomm) { 73d8a68f86SHong Zhang ierr = PetscSubcommCreate(comm,&red->psubcomm);CHKERRQ(ierr); 74d8a68f86SHong Zhang ierr = PetscSubcommSetNumber(red->psubcomm,red->nsubcomm);CHKERRQ(ierr); 75a23b1e67SHong Zhang ierr = PetscSubcommSetType(red->psubcomm,PETSC_SUBCOMM_CONTIGUOUS);CHKERRQ(ierr); 76a23b1e67SHong Zhang /* enable runtime switch of psubcomm type, e.g., '-psubcomm_type interlaced */ 77a23b1e67SHong Zhang ierr = PetscSubcommSetFromOptions(red->psubcomm);CHKERRQ(ierr); 783bb1ff40SBarry Smith ierr = PetscLogObjectMemory((PetscObject)pc,sizeof(PetscSubcomm));CHKERRQ(ierr); 791fbd8f88SHong Zhang 801fbd8f88SHong Zhang /* create a new PC that processors in each subcomm have copy of */ 81306c2d5bSBarry Smith subcomm = PetscSubcommChild(red->psubcomm); 822fa5cd67SKarl Rupp 835f06b7aaSBarry Smith ierr = KSPCreate(subcomm,&red->ksp);CHKERRQ(ierr); 84422a814eSBarry Smith ierr = KSPSetErrorIfNotConverged(red->ksp,pc->erroriffailure);CHKERRQ(ierr); 855f06b7aaSBarry Smith ierr = PetscObjectIncrementTabLevel((PetscObject)red->ksp,(PetscObject)pc,1);CHKERRQ(ierr); 863bb1ff40SBarry Smith ierr = PetscLogObjectParent((PetscObject)pc,(PetscObject)red->ksp);CHKERRQ(ierr); 875f06b7aaSBarry Smith ierr = KSPSetType(red->ksp,KSPPREONLY);CHKERRQ(ierr); 885f06b7aaSBarry Smith ierr = KSPGetPC(red->ksp,&red->pc);CHKERRQ(ierr); 89cf52b8b1SHong Zhang ierr = PCSetType(red->pc,PCLU);CHKERRQ(ierr); 90cf52b8b1SHong Zhang 911fbd8f88SHong Zhang ierr = PCGetOptionsPrefix(pc,&prefix);CHKERRQ(ierr); 925f06b7aaSBarry Smith ierr = KSPSetOptionsPrefix(red->ksp,prefix);CHKERRQ(ierr); 935f06b7aaSBarry Smith ierr = KSPAppendOptionsPrefix(red->ksp,"redundant_");CHKERRQ(ierr); 941b81debcSHong Zhang } else { 95306c2d5bSBarry Smith subcomm = PetscSubcommChild(red->psubcomm); 961b81debcSHong Zhang } 971fbd8f88SHong Zhang 981b81debcSHong Zhang if (red->useparallelmat) { 991b81debcSHong Zhang /* grab the parallel matrix and put it into processors of a subcomminicator */ 10053cd1579SHong Zhang ierr = MatCreateRedundantMatrix(pc->pmat,red->psubcomm->n,subcomm,MAT_INITIAL_MATRIX,&red->pmats);CHKERRQ(ierr); 10123ee1639SBarry Smith ierr = KSPSetOperators(red->ksp,red->pmats,red->pmats);CHKERRQ(ierr); 1024b9ad928SBarry Smith 1031b81debcSHong Zhang /* get working vectors xsub and ysub */ 1042a7a6963SBarry Smith ierr = MatCreateVecs(red->pmats,&red->xsub,&red->ysub);CHKERRQ(ierr); 1052fa5cd67SKarl Rupp 1068b96b0d2SHong Zhang /* create working vectors xdup and ydup. 1078b96b0d2SHong Zhang xdup concatenates all xsub's contigously to form a mpi vector over dupcomm (see PetscSubcommCreate_interlaced()) 1088b96b0d2SHong Zhang ydup concatenates all ysub and has empty local arrays because ysub's arrays will be place into it. 109ce94432eSBarry Smith Note: we use communicator dupcomm, not PetscObjectComm((PetscObject)pc)! */ 1101b81debcSHong Zhang ierr = MatGetLocalSize(red->pmats,&mloc_sub,NULL);CHKERRQ(ierr); 11136be1a5eSBarry Smith ierr = VecCreateMPI(PetscSubcommContiguousParent(red->psubcomm),mloc_sub,PETSC_DECIDE,&red->xdup);CHKERRQ(ierr); 11236be1a5eSBarry Smith ierr = VecCreateMPIWithArray(PetscSubcommContiguousParent(red->psubcomm),1,mloc_sub,PETSC_DECIDE,NULL,&red->ydup);CHKERRQ(ierr); 1133f457be1SHong Zhang 114f68be91cSHong Zhang /* create vecscatters */ 115f68be91cSHong Zhang if (!red->scatterin) { /* efficiency of scatterin is independent from psubcomm_type! */ 1163f457be1SHong Zhang IS is1,is2; 1173f457be1SHong Zhang PetscInt *idx1,*idx2,i,j,k; 11845fc02eaSBarry Smith 1192a7a6963SBarry Smith ierr = MatCreateVecs(pc->pmat,&x,0);CHKERRQ(ierr); 1201b81debcSHong Zhang ierr = VecGetSize(x,&M);CHKERRQ(ierr); 1211b81debcSHong Zhang ierr = VecGetOwnershipRange(x,&mstart,&mend);CHKERRQ(ierr); 1221b81debcSHong Zhang mlocal = mend - mstart; 123dcca6d9dSJed Brown ierr = PetscMalloc2(red->psubcomm->n*mlocal,&idx1,red->psubcomm->n*mlocal,&idx2);CHKERRQ(ierr); 1243f457be1SHong Zhang j = 0; 1251fbd8f88SHong Zhang for (k=0; k<red->psubcomm->n; k++) { 1263f457be1SHong Zhang for (i=mstart; i<mend; i++) { 1273f457be1SHong Zhang idx1[j] = i; 128ddc54837SHong Zhang idx2[j++] = i + M*k; 1293f457be1SHong Zhang } 1303f457be1SHong Zhang } 13170b3c8c7SBarry Smith ierr = ISCreateGeneral(comm,red->psubcomm->n*mlocal,idx1,PETSC_COPY_VALUES,&is1);CHKERRQ(ierr); 13270b3c8c7SBarry Smith ierr = ISCreateGeneral(comm,red->psubcomm->n*mlocal,idx2,PETSC_COPY_VALUES,&is2);CHKERRQ(ierr); 133ddc54837SHong Zhang ierr = VecScatterCreate(x,is1,red->xdup,is2,&red->scatterin);CHKERRQ(ierr); 134fcfd50ebSBarry Smith ierr = ISDestroy(&is1);CHKERRQ(ierr); 135fcfd50ebSBarry Smith ierr = ISDestroy(&is2);CHKERRQ(ierr); 1363f457be1SHong Zhang 1376909748bSHong Zhang /* Impl below is good for PETSC_SUBCOMM_INTERLACED (no inter-process communication) and PETSC_SUBCOMM_CONTIGUOUS (communication within subcomm) */ 138ddc54837SHong Zhang ierr = ISCreateStride(comm,mlocal,mstart+ red->psubcomm->color*M,1,&is1);CHKERRQ(ierr); 1393f457be1SHong Zhang ierr = ISCreateStride(comm,mlocal,mstart,1,&is2);CHKERRQ(ierr); 140ddc54837SHong Zhang ierr = VecScatterCreate(red->xdup,is1,x,is2,&red->scatterout);CHKERRQ(ierr); 141fcfd50ebSBarry Smith ierr = ISDestroy(&is1);CHKERRQ(ierr); 142fcfd50ebSBarry Smith ierr = ISDestroy(&is2);CHKERRQ(ierr); 1431d79065fSBarry Smith ierr = PetscFree2(idx1,idx2);CHKERRQ(ierr); 144ddc54837SHong Zhang ierr = VecDestroy(&x);CHKERRQ(ierr); 1451b81debcSHong Zhang } 146ab661555SHong Zhang } else { /* !red->useparallelmat */ 14723ee1639SBarry Smith ierr = KSPSetOperators(red->ksp,pc->mat,pc->pmat);CHKERRQ(ierr); 1481b81debcSHong Zhang } 149ab661555SHong Zhang } else { /* pc->setupcalled */ 1504b9ad928SBarry Smith if (red->useparallelmat) { 151ab661555SHong Zhang MatReuse reuse; 1521b81debcSHong Zhang /* grab the parallel matrix and put it into processors of a subcomminicator */ 1531b81debcSHong Zhang /*--------------------------------------------------------------------------*/ 154ab661555SHong Zhang if (pc->flag == DIFFERENT_NONZERO_PATTERN) { 1554b9ad928SBarry Smith /* destroy old matrices */ 1566bf464f9SBarry Smith ierr = MatDestroy(&red->pmats);CHKERRQ(ierr); 157ab661555SHong Zhang reuse = MAT_INITIAL_MATRIX; 1584b9ad928SBarry Smith } else { 159ab661555SHong Zhang reuse = MAT_REUSE_MATRIX; 160ab661555SHong Zhang } 161306c2d5bSBarry Smith ierr = MatCreateRedundantMatrix(pc->pmat,red->psubcomm->n,PetscSubcommChild(red->psubcomm),reuse,&red->pmats);CHKERRQ(ierr); 16223ee1639SBarry Smith ierr = KSPSetOperators(red->ksp,red->pmats,red->pmats);CHKERRQ(ierr); 163ab661555SHong Zhang } else { /* !red->useparallelmat */ 16423ee1639SBarry Smith ierr = KSPSetOperators(red->ksp,pc->mat,pc->pmat);CHKERRQ(ierr); 1654b9ad928SBarry Smith } 166ab661555SHong Zhang } 1671b81debcSHong Zhang 1680c24e6a1SHong Zhang if (pc->setfromoptionscalled) { 1693e065800SHong Zhang ierr = KSPSetFromOptions(red->ksp);CHKERRQ(ierr); 1700c24e6a1SHong Zhang } 1713e065800SHong Zhang ierr = KSPSetUp(red->ksp);CHKERRQ(ierr); 1724b9ad928SBarry Smith PetscFunctionReturn(0); 1734b9ad928SBarry Smith } 1744b9ad928SBarry Smith 1754b9ad928SBarry Smith #undef __FUNCT__ 1764b9ad928SBarry Smith #define __FUNCT__ "PCApply_Redundant" 1776849ba73SBarry Smith static PetscErrorCode PCApply_Redundant(PC pc,Vec x,Vec y) 1784b9ad928SBarry Smith { 1794b9ad928SBarry Smith PC_Redundant *red = (PC_Redundant*)pc->data; 180dfbe8321SBarry Smith PetscErrorCode ierr; 1813f457be1SHong Zhang PetscScalar *array; 1824b9ad928SBarry Smith 1834b9ad928SBarry Smith PetscFunctionBegin; 184ddc54837SHong Zhang if (!red->useparallelmat) { 185ddc54837SHong Zhang ierr = KSPSolve(red->ksp,x,y);CHKERRQ(ierr); 186ddc54837SHong Zhang PetscFunctionReturn(0); 187ddc54837SHong Zhang } 188ddc54837SHong Zhang 1893f457be1SHong Zhang /* scatter x to xdup */ 190ca9f406cSSatish Balay ierr = VecScatterBegin(red->scatterin,x,red->xdup,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 191ca9f406cSSatish Balay ierr = VecScatterEnd(red->scatterin,x,red->xdup,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 1923f457be1SHong Zhang 1933f457be1SHong Zhang /* place xdup's local array into xsub */ 1943f457be1SHong Zhang ierr = VecGetArray(red->xdup,&array);CHKERRQ(ierr); 1953f457be1SHong Zhang ierr = VecPlaceArray(red->xsub,(const PetscScalar*)array);CHKERRQ(ierr); 1964b9ad928SBarry Smith 1974b9ad928SBarry Smith /* apply preconditioner on each processor */ 19883ab6a24SBarry Smith ierr = KSPSolve(red->ksp,red->xsub,red->ysub);CHKERRQ(ierr); 1993f457be1SHong Zhang ierr = VecResetArray(red->xsub);CHKERRQ(ierr); 2003f457be1SHong Zhang ierr = VecRestoreArray(red->xdup,&array);CHKERRQ(ierr); 2014b9ad928SBarry Smith 2023f457be1SHong Zhang /* place ysub's local array into ydup */ 2033f457be1SHong Zhang ierr = VecGetArray(red->ysub,&array);CHKERRQ(ierr); 2043f457be1SHong Zhang ierr = VecPlaceArray(red->ydup,(const PetscScalar*)array);CHKERRQ(ierr); 2053f457be1SHong Zhang 2063f457be1SHong Zhang /* scatter ydup to y */ 207ca9f406cSSatish Balay ierr = VecScatterBegin(red->scatterout,red->ydup,y,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 208ca9f406cSSatish Balay ierr = VecScatterEnd(red->scatterout,red->ydup,y,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 2093f457be1SHong Zhang ierr = VecResetArray(red->ydup);CHKERRQ(ierr); 2103f457be1SHong Zhang ierr = VecRestoreArray(red->ysub,&array);CHKERRQ(ierr); 2114b9ad928SBarry Smith PetscFunctionReturn(0); 2124b9ad928SBarry Smith } 2134b9ad928SBarry Smith 2144b9ad928SBarry Smith #undef __FUNCT__ 215d88bfacbSStefano Zampini #define __FUNCT__ "PCApplyTranspose_Redundant" 216d88bfacbSStefano Zampini static PetscErrorCode PCApplyTranspose_Redundant(PC pc,Vec x,Vec y) 217d88bfacbSStefano Zampini { 218d88bfacbSStefano Zampini PC_Redundant *red = (PC_Redundant*)pc->data; 219d88bfacbSStefano Zampini PetscErrorCode ierr; 220d88bfacbSStefano Zampini PetscScalar *array; 221d88bfacbSStefano Zampini 222d88bfacbSStefano Zampini PetscFunctionBegin; 223d88bfacbSStefano Zampini if (!red->useparallelmat) { 224d88bfacbSStefano Zampini ierr = KSPSolveTranspose(red->ksp,x,y);CHKERRQ(ierr); 225d88bfacbSStefano Zampini PetscFunctionReturn(0); 226d88bfacbSStefano Zampini } 227d88bfacbSStefano Zampini 228d88bfacbSStefano Zampini /* scatter x to xdup */ 229d88bfacbSStefano Zampini ierr = VecScatterBegin(red->scatterin,x,red->xdup,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 230d88bfacbSStefano Zampini ierr = VecScatterEnd(red->scatterin,x,red->xdup,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 231d88bfacbSStefano Zampini 232d88bfacbSStefano Zampini /* place xdup's local array into xsub */ 233d88bfacbSStefano Zampini ierr = VecGetArray(red->xdup,&array);CHKERRQ(ierr); 234d88bfacbSStefano Zampini ierr = VecPlaceArray(red->xsub,(const PetscScalar*)array);CHKERRQ(ierr); 235d88bfacbSStefano Zampini 236d88bfacbSStefano Zampini /* apply preconditioner on each processor */ 237d88bfacbSStefano Zampini ierr = KSPSolveTranspose(red->ksp,red->xsub,red->ysub);CHKERRQ(ierr); 238d88bfacbSStefano Zampini ierr = VecResetArray(red->xsub);CHKERRQ(ierr); 239d88bfacbSStefano Zampini ierr = VecRestoreArray(red->xdup,&array);CHKERRQ(ierr); 240d88bfacbSStefano Zampini 241d88bfacbSStefano Zampini /* place ysub's local array into ydup */ 242d88bfacbSStefano Zampini ierr = VecGetArray(red->ysub,&array);CHKERRQ(ierr); 243d88bfacbSStefano Zampini ierr = VecPlaceArray(red->ydup,(const PetscScalar*)array);CHKERRQ(ierr); 244d88bfacbSStefano Zampini 245d88bfacbSStefano Zampini /* scatter ydup to y */ 246d88bfacbSStefano Zampini ierr = VecScatterBegin(red->scatterout,red->ydup,y,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 247d88bfacbSStefano Zampini ierr = VecScatterEnd(red->scatterout,red->ydup,y,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 248d88bfacbSStefano Zampini ierr = VecResetArray(red->ydup);CHKERRQ(ierr); 249d88bfacbSStefano Zampini ierr = VecRestoreArray(red->ysub,&array);CHKERRQ(ierr); 250d88bfacbSStefano Zampini PetscFunctionReturn(0); 251d88bfacbSStefano Zampini } 252d88bfacbSStefano Zampini 253d88bfacbSStefano Zampini #undef __FUNCT__ 2541ea5a559SBarry Smith #define __FUNCT__ "PCReset_Redundant" 2551ea5a559SBarry Smith static PetscErrorCode PCReset_Redundant(PC pc) 2564b9ad928SBarry Smith { 2574b9ad928SBarry Smith PC_Redundant *red = (PC_Redundant*)pc->data; 258dfbe8321SBarry Smith PetscErrorCode ierr; 2594b9ad928SBarry Smith 2604b9ad928SBarry Smith PetscFunctionBegin; 2611b81debcSHong Zhang if (red->useparallelmat) { 2626bf464f9SBarry Smith ierr = VecScatterDestroy(&red->scatterin);CHKERRQ(ierr); 2636bf464f9SBarry Smith ierr = VecScatterDestroy(&red->scatterout);CHKERRQ(ierr); 2646bf464f9SBarry Smith ierr = VecDestroy(&red->ysub);CHKERRQ(ierr); 2656bf464f9SBarry Smith ierr = VecDestroy(&red->xsub);CHKERRQ(ierr); 2666bf464f9SBarry Smith ierr = VecDestroy(&red->xdup);CHKERRQ(ierr); 2676bf464f9SBarry Smith ierr = VecDestroy(&red->ydup);CHKERRQ(ierr); 2681b81debcSHong Zhang } 2696bf464f9SBarry Smith ierr = MatDestroy(&red->pmats);CHKERRQ(ierr); 2701b81debcSHong Zhang ierr = KSPReset(red->ksp);CHKERRQ(ierr); 2711ea5a559SBarry Smith PetscFunctionReturn(0); 2721ea5a559SBarry Smith } 2731ea5a559SBarry Smith 2741ea5a559SBarry Smith #undef __FUNCT__ 2751ea5a559SBarry Smith #define __FUNCT__ "PCDestroy_Redundant" 2761ea5a559SBarry Smith static PetscErrorCode PCDestroy_Redundant(PC pc) 2771ea5a559SBarry Smith { 2781ea5a559SBarry Smith PC_Redundant *red = (PC_Redundant*)pc->data; 2791ea5a559SBarry Smith PetscErrorCode ierr; 2801ea5a559SBarry Smith 2811ea5a559SBarry Smith PetscFunctionBegin; 2821ea5a559SBarry Smith ierr = PCReset_Redundant(pc);CHKERRQ(ierr); 2836bf464f9SBarry Smith ierr = KSPDestroy(&red->ksp);CHKERRQ(ierr); 2846bf464f9SBarry Smith ierr = PetscSubcommDestroy(&red->psubcomm);CHKERRQ(ierr); 285c31cb41cSBarry Smith ierr = PetscFree(pc->data);CHKERRQ(ierr); 2864b9ad928SBarry Smith PetscFunctionReturn(0); 2874b9ad928SBarry Smith } 2884b9ad928SBarry Smith 2894b9ad928SBarry Smith #undef __FUNCT__ 2904b9ad928SBarry Smith #define __FUNCT__ "PCSetFromOptions_Redundant" 2918c34d3f5SBarry Smith static PetscErrorCode PCSetFromOptions_Redundant(PetscOptions *PetscOptionsObject,PC pc) 2924b9ad928SBarry Smith { 293a98ce0f4SHong Zhang PetscErrorCode ierr; 294a98ce0f4SHong Zhang PC_Redundant *red = (PC_Redundant*)pc->data; 295a98ce0f4SHong Zhang 2964b9ad928SBarry Smith PetscFunctionBegin; 297e55864a3SBarry Smith ierr = PetscOptionsHead(PetscOptionsObject,"Redundant options");CHKERRQ(ierr); 29809a6bc64SHong Zhang ierr = PetscOptionsInt("-pc_redundant_number","Number of redundant pc","PCRedundantSetNumber",red->nsubcomm,&red->nsubcomm,0);CHKERRQ(ierr); 299a98ce0f4SHong Zhang ierr = PetscOptionsTail();CHKERRQ(ierr); 3004b9ad928SBarry Smith PetscFunctionReturn(0); 3014b9ad928SBarry Smith } 3024b9ad928SBarry Smith 3034b9ad928SBarry Smith #undef __FUNCT__ 30409a6bc64SHong Zhang #define __FUNCT__ "PCRedundantSetNumber_Redundant" 305f7a08781SBarry Smith static PetscErrorCode PCRedundantSetNumber_Redundant(PC pc,PetscInt nreds) 30609a6bc64SHong Zhang { 30709a6bc64SHong Zhang PC_Redundant *red = (PC_Redundant*)pc->data; 30809a6bc64SHong Zhang 30909a6bc64SHong Zhang PetscFunctionBegin; 31009a6bc64SHong Zhang red->nsubcomm = nreds; 31109a6bc64SHong Zhang PetscFunctionReturn(0); 31209a6bc64SHong Zhang } 31309a6bc64SHong Zhang 31409a6bc64SHong Zhang #undef __FUNCT__ 31509a6bc64SHong Zhang #define __FUNCT__ "PCRedundantSetNumber" 31609a6bc64SHong Zhang /*@ 31709a6bc64SHong Zhang PCRedundantSetNumber - Sets the number of redundant preconditioner contexts. 31809a6bc64SHong Zhang 3193f9fe445SBarry Smith Logically Collective on PC 32009a6bc64SHong Zhang 32109a6bc64SHong Zhang Input Parameters: 32209a6bc64SHong Zhang + pc - the preconditioner context 3239b21d695SBarry Smith - nredundant - number of redundant preconditioner contexts; for example if you are using 64 MPI processes and 3249b21d695SBarry Smith use an nredundant of 4 there will be 4 parallel solves each on 16 = 64/4 processes. 32509a6bc64SHong Zhang 32609a6bc64SHong Zhang Level: advanced 32709a6bc64SHong Zhang 32809a6bc64SHong Zhang .keywords: PC, redundant solve 32909a6bc64SHong Zhang @*/ 3307087cfbeSBarry Smith PetscErrorCode PCRedundantSetNumber(PC pc,PetscInt nredundant) 33109a6bc64SHong Zhang { 3324ac538c5SBarry Smith PetscErrorCode ierr; 33309a6bc64SHong Zhang 33409a6bc64SHong Zhang PetscFunctionBegin; 3350700a824SBarry Smith PetscValidHeaderSpecific(pc,PC_CLASSID,1); 336ce94432eSBarry Smith if (nredundant <= 0) SETERRQ1(PetscObjectComm((PetscObject)pc),PETSC_ERR_ARG_WRONG, "num of redundant pc %D must be positive",nredundant); 3374ac538c5SBarry Smith ierr = PetscTryMethod(pc,"PCRedundantSetNumber_C",(PC,PetscInt),(pc,nredundant));CHKERRQ(ierr); 33809a6bc64SHong Zhang PetscFunctionReturn(0); 33909a6bc64SHong Zhang } 34009a6bc64SHong Zhang 34109a6bc64SHong Zhang #undef __FUNCT__ 3424b9ad928SBarry Smith #define __FUNCT__ "PCRedundantSetScatter_Redundant" 343f7a08781SBarry Smith static PetscErrorCode PCRedundantSetScatter_Redundant(PC pc,VecScatter in,VecScatter out) 3444b9ad928SBarry Smith { 3454b9ad928SBarry Smith PC_Redundant *red = (PC_Redundant*)pc->data; 346dfbe8321SBarry Smith PetscErrorCode ierr; 3474b9ad928SBarry Smith 3484b9ad928SBarry Smith PetscFunctionBegin; 3494b9ad928SBarry Smith ierr = PetscObjectReference((PetscObject)in);CHKERRQ(ierr); 3506bf464f9SBarry Smith ierr = VecScatterDestroy(&red->scatterin);CHKERRQ(ierr); 3512fa5cd67SKarl Rupp 352c3122656SLisandro Dalcin red->scatterin = in; 3532fa5cd67SKarl Rupp 3544b9ad928SBarry Smith ierr = PetscObjectReference((PetscObject)out);CHKERRQ(ierr); 3556bf464f9SBarry Smith ierr = VecScatterDestroy(&red->scatterout);CHKERRQ(ierr); 356c3122656SLisandro Dalcin red->scatterout = out; 3574b9ad928SBarry Smith PetscFunctionReturn(0); 3584b9ad928SBarry Smith } 3594b9ad928SBarry Smith 3604b9ad928SBarry Smith #undef __FUNCT__ 3614b9ad928SBarry Smith #define __FUNCT__ "PCRedundantSetScatter" 3624b9ad928SBarry Smith /*@ 3634b9ad928SBarry Smith PCRedundantSetScatter - Sets the scatter used to copy values into the 3644b9ad928SBarry Smith redundant local solve and the scatter to move them back into the global 3654b9ad928SBarry Smith vector. 3664b9ad928SBarry Smith 3673f9fe445SBarry Smith Logically Collective on PC 3684b9ad928SBarry Smith 3694b9ad928SBarry Smith Input Parameters: 3704b9ad928SBarry Smith + pc - the preconditioner context 3714b9ad928SBarry Smith . in - the scatter to move the values in 3724b9ad928SBarry Smith - out - the scatter to move them out 3734b9ad928SBarry Smith 3744b9ad928SBarry Smith Level: advanced 3754b9ad928SBarry Smith 3764b9ad928SBarry Smith .keywords: PC, redundant solve 3774b9ad928SBarry Smith @*/ 3787087cfbeSBarry Smith PetscErrorCode PCRedundantSetScatter(PC pc,VecScatter in,VecScatter out) 3794b9ad928SBarry Smith { 3804ac538c5SBarry Smith PetscErrorCode ierr; 3814b9ad928SBarry Smith 3824b9ad928SBarry Smith PetscFunctionBegin; 3830700a824SBarry Smith PetscValidHeaderSpecific(pc,PC_CLASSID,1); 3840700a824SBarry Smith PetscValidHeaderSpecific(in,VEC_SCATTER_CLASSID,2); 3850700a824SBarry Smith PetscValidHeaderSpecific(out,VEC_SCATTER_CLASSID,3); 3864ac538c5SBarry Smith ierr = PetscTryMethod(pc,"PCRedundantSetScatter_C",(PC,VecScatter,VecScatter),(pc,in,out));CHKERRQ(ierr); 3874b9ad928SBarry Smith PetscFunctionReturn(0); 3884b9ad928SBarry Smith } 3894b9ad928SBarry Smith 3904b9ad928SBarry Smith #undef __FUNCT__ 39183ab6a24SBarry Smith #define __FUNCT__ "PCRedundantGetKSP_Redundant" 392f7a08781SBarry Smith static PetscErrorCode PCRedundantGetKSP_Redundant(PC pc,KSP *innerksp) 3934b9ad928SBarry Smith { 3945f06b7aaSBarry Smith PetscErrorCode ierr; 3954b9ad928SBarry Smith PC_Redundant *red = (PC_Redundant*)pc->data; 3965f06b7aaSBarry Smith MPI_Comm comm,subcomm; 3975f06b7aaSBarry Smith const char *prefix; 3984b9ad928SBarry Smith 3994b9ad928SBarry Smith PetscFunctionBegin; 4005f06b7aaSBarry Smith if (!red->psubcomm) { 4015f06b7aaSBarry Smith ierr = PetscObjectGetComm((PetscObject)pc,&comm);CHKERRQ(ierr); 402d8a68f86SHong Zhang ierr = PetscSubcommCreate(comm,&red->psubcomm);CHKERRQ(ierr); 403d8a68f86SHong Zhang ierr = PetscSubcommSetNumber(red->psubcomm,red->nsubcomm);CHKERRQ(ierr); 404d8a68f86SHong Zhang ierr = PetscSubcommSetType(red->psubcomm,PETSC_SUBCOMM_INTERLACED);CHKERRQ(ierr); 4053bb1ff40SBarry Smith ierr = PetscLogObjectMemory((PetscObject)pc,sizeof(PetscSubcomm));CHKERRQ(ierr); 4065f06b7aaSBarry Smith 4075f06b7aaSBarry Smith /* create a new PC that processors in each subcomm have copy of */ 408306c2d5bSBarry Smith subcomm = PetscSubcommChild(red->psubcomm); 4092fa5cd67SKarl Rupp 4105f06b7aaSBarry Smith ierr = KSPCreate(subcomm,&red->ksp);CHKERRQ(ierr); 411422a814eSBarry Smith ierr = KSPSetErrorIfNotConverged(red->ksp,pc->erroriffailure);CHKERRQ(ierr); 4125f06b7aaSBarry Smith ierr = PetscObjectIncrementTabLevel((PetscObject)red->ksp,(PetscObject)pc,1);CHKERRQ(ierr); 4133bb1ff40SBarry Smith ierr = PetscLogObjectParent((PetscObject)pc,(PetscObject)red->ksp);CHKERRQ(ierr); 4145f06b7aaSBarry Smith ierr = KSPSetType(red->ksp,KSPPREONLY);CHKERRQ(ierr); 4155f06b7aaSBarry Smith ierr = KSPGetPC(red->ksp,&red->pc);CHKERRQ(ierr); 4165f06b7aaSBarry Smith ierr = PCSetType(red->pc,PCLU);CHKERRQ(ierr); 4175f06b7aaSBarry Smith 4185f06b7aaSBarry Smith ierr = PCGetOptionsPrefix(pc,&prefix);CHKERRQ(ierr); 4195f06b7aaSBarry Smith ierr = KSPSetOptionsPrefix(red->ksp,prefix);CHKERRQ(ierr); 4205f06b7aaSBarry Smith ierr = KSPAppendOptionsPrefix(red->ksp,"redundant_");CHKERRQ(ierr); 4215f06b7aaSBarry Smith } 42283ab6a24SBarry Smith *innerksp = red->ksp; 4234b9ad928SBarry Smith PetscFunctionReturn(0); 4244b9ad928SBarry Smith } 4254b9ad928SBarry Smith 4264b9ad928SBarry Smith #undef __FUNCT__ 42783ab6a24SBarry Smith #define __FUNCT__ "PCRedundantGetKSP" 4284b9ad928SBarry Smith /*@ 42983ab6a24SBarry Smith PCRedundantGetKSP - Gets the less parallel KSP created by the redundant PC. 4304b9ad928SBarry Smith 4314b9ad928SBarry Smith Not Collective 4324b9ad928SBarry Smith 4334b9ad928SBarry Smith Input Parameter: 4344b9ad928SBarry Smith . pc - the preconditioner context 4354b9ad928SBarry Smith 4364b9ad928SBarry Smith Output Parameter: 43783ab6a24SBarry Smith . innerksp - the KSP on the smaller set of processes 4384b9ad928SBarry Smith 4394b9ad928SBarry Smith Level: advanced 4404b9ad928SBarry Smith 4414b9ad928SBarry Smith .keywords: PC, redundant solve 4424b9ad928SBarry Smith @*/ 44383ab6a24SBarry Smith PetscErrorCode PCRedundantGetKSP(PC pc,KSP *innerksp) 4444b9ad928SBarry Smith { 4454ac538c5SBarry Smith PetscErrorCode ierr; 4464b9ad928SBarry Smith 4474b9ad928SBarry Smith PetscFunctionBegin; 4480700a824SBarry Smith PetscValidHeaderSpecific(pc,PC_CLASSID,1); 44983ab6a24SBarry Smith PetscValidPointer(innerksp,2); 45083ab6a24SBarry Smith ierr = PetscTryMethod(pc,"PCRedundantGetKSP_C",(PC,KSP*),(pc,innerksp));CHKERRQ(ierr); 4514b9ad928SBarry Smith PetscFunctionReturn(0); 4524b9ad928SBarry Smith } 4534b9ad928SBarry Smith 4544b9ad928SBarry Smith #undef __FUNCT__ 4554b9ad928SBarry Smith #define __FUNCT__ "PCRedundantGetOperators_Redundant" 456f7a08781SBarry Smith static PetscErrorCode PCRedundantGetOperators_Redundant(PC pc,Mat *mat,Mat *pmat) 4574b9ad928SBarry Smith { 4584b9ad928SBarry Smith PC_Redundant *red = (PC_Redundant*)pc->data; 4594b9ad928SBarry Smith 4604b9ad928SBarry Smith PetscFunctionBegin; 461b3804887SHong Zhang if (mat) *mat = red->pmats; 462b3804887SHong Zhang if (pmat) *pmat = red->pmats; 4634b9ad928SBarry Smith PetscFunctionReturn(0); 4644b9ad928SBarry Smith } 4654b9ad928SBarry Smith 4664b9ad928SBarry Smith #undef __FUNCT__ 4674b9ad928SBarry Smith #define __FUNCT__ "PCRedundantGetOperators" 4684b9ad928SBarry Smith /*@ 4694b9ad928SBarry Smith PCRedundantGetOperators - gets the sequential matrix and preconditioner matrix 4704b9ad928SBarry Smith 4714b9ad928SBarry Smith Not Collective 4724b9ad928SBarry Smith 4734b9ad928SBarry Smith Input Parameter: 4744b9ad928SBarry Smith . pc - the preconditioner context 4754b9ad928SBarry Smith 4764b9ad928SBarry Smith Output Parameters: 4774b9ad928SBarry Smith + mat - the matrix 4784b9ad928SBarry Smith - pmat - the (possibly different) preconditioner matrix 4794b9ad928SBarry Smith 4804b9ad928SBarry Smith Level: advanced 4814b9ad928SBarry Smith 4824b9ad928SBarry Smith .keywords: PC, redundant solve 4834b9ad928SBarry Smith @*/ 4847087cfbeSBarry Smith PetscErrorCode PCRedundantGetOperators(PC pc,Mat *mat,Mat *pmat) 4854b9ad928SBarry Smith { 4864ac538c5SBarry Smith PetscErrorCode ierr; 4874b9ad928SBarry Smith 4884b9ad928SBarry Smith PetscFunctionBegin; 4890700a824SBarry Smith PetscValidHeaderSpecific(pc,PC_CLASSID,1); 4904482741eSBarry Smith if (mat) PetscValidPointer(mat,2); 4914482741eSBarry Smith if (pmat) PetscValidPointer(pmat,3); 4924ac538c5SBarry Smith ierr = PetscTryMethod(pc,"PCRedundantGetOperators_C",(PC,Mat*,Mat*),(pc,mat,pmat));CHKERRQ(ierr); 4934b9ad928SBarry Smith PetscFunctionReturn(0); 4944b9ad928SBarry Smith } 4954b9ad928SBarry Smith 4964b9ad928SBarry Smith /* -------------------------------------------------------------------------------------*/ 49737a17b4dSBarry Smith /*MC 49883ab6a24SBarry Smith PCREDUNDANT - Runs a KSP solver with preconditioner for the entire problem on subgroups of processors 49937a17b4dSBarry Smith 50083ab6a24SBarry Smith Options for the redundant preconditioners can be set with -redundant_pc_xxx for the redundant KSP with -redundant_ksp_xxx 50137a17b4dSBarry Smith 50209391456SBarry Smith Options Database: 5039b21d695SBarry Smith . -pc_redundant_number <n> - number of redundant solves, for example if you are using 64 MPI processes and 5049b21d695SBarry Smith use an n of 4 there will be 4 parallel solves each on 16 = 64/4 processes. 50509391456SBarry Smith 50637a17b4dSBarry Smith Level: intermediate 50737a17b4dSBarry Smith 50883ab6a24SBarry Smith Notes: The default KSP is preonly and the default PC is LU. 50983ab6a24SBarry Smith 51083ab6a24SBarry Smith Developer Notes: Note that PCSetInitialGuessNonzero() is not used by this class but likely should be. 5119cfaa89bSBarry Smith 51237a17b4dSBarry Smith .seealso: PCCreate(), PCSetType(), PCType (for list of available types), PCRedundantSetScatter(), 51383ab6a24SBarry Smith PCRedundantGetKSP(), PCRedundantGetOperators(), PCRedundantSetNumber() 51437a17b4dSBarry Smith M*/ 51537a17b4dSBarry Smith 5164b9ad928SBarry Smith #undef __FUNCT__ 5174b9ad928SBarry Smith #define __FUNCT__ "PCCreate_Redundant" 5188cc058d9SJed Brown PETSC_EXTERN PetscErrorCode PCCreate_Redundant(PC pc) 5194b9ad928SBarry Smith { 520dfbe8321SBarry Smith PetscErrorCode ierr; 5214b9ad928SBarry Smith PC_Redundant *red; 52269db28dcSHong Zhang PetscMPIInt size; 5233f457be1SHong Zhang 5244b9ad928SBarry Smith PetscFunctionBegin; 525b00a9115SJed Brown ierr = PetscNewLog(pc,&red);CHKERRQ(ierr); 526ce94432eSBarry Smith ierr = MPI_Comm_size(PetscObjectComm((PetscObject)pc),&size);CHKERRQ(ierr); 5272fa5cd67SKarl Rupp 52869db28dcSHong Zhang red->nsubcomm = size; 5294b9ad928SBarry Smith red->useparallelmat = PETSC_TRUE; 5301fbd8f88SHong Zhang pc->data = (void*)red; 5314b9ad928SBarry Smith 5324b9ad928SBarry Smith pc->ops->apply = PCApply_Redundant; 533d88bfacbSStefano Zampini pc->ops->applytranspose = PCApplyTranspose_Redundant; 5344b9ad928SBarry Smith pc->ops->setup = PCSetUp_Redundant; 5354b9ad928SBarry Smith pc->ops->destroy = PCDestroy_Redundant; 5361ea5a559SBarry Smith pc->ops->reset = PCReset_Redundant; 5374b9ad928SBarry Smith pc->ops->setfromoptions = PCSetFromOptions_Redundant; 5384b9ad928SBarry Smith pc->ops->view = PCView_Redundant; 5392fa5cd67SKarl Rupp 540bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)pc,"PCRedundantSetScatter_C",PCRedundantSetScatter_Redundant);CHKERRQ(ierr); 541bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)pc,"PCRedundantSetNumber_C",PCRedundantSetNumber_Redundant);CHKERRQ(ierr); 542bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)pc,"PCRedundantGetKSP_C",PCRedundantGetKSP_Redundant);CHKERRQ(ierr); 543bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)pc,"PCRedundantGetOperators_C",PCRedundantGetOperators_Redundant);CHKERRQ(ierr); 5444b9ad928SBarry Smith PetscFunctionReturn(0); 5454b9ad928SBarry Smith } 546b2573a8aSBarry Smith 547