1eaedb033SPeter Brune #include <petsc-private/snesimpl.h> /*I "petscsnes.h" I*/ 2111ade9eSPeter Brune #include <petscdm.h> 3eaedb033SPeter Brune 4eaedb033SPeter Brune typedef struct { 5eaedb033SPeter Brune PetscInt n; /* local subdomains */ 6eaedb033SPeter Brune SNES *subsnes; /* nonlinear solvers for each subdomain */ 7eaedb033SPeter Brune Vec *x; /* solution vectors */ 8111ade9eSPeter Brune Vec *xl; /* solution local vectors */ 9111ade9eSPeter Brune Vec *y; /* step vectors */ 10eaedb033SPeter Brune Vec *b; /* rhs vectors */ 11111ade9eSPeter Brune VecScatter *oscatter; /* scatter from global space to the subdomain global space */ 12111ade9eSPeter Brune VecScatter *iscatter; /* scatter from global space to the nonoverlapping subdomain space */ 13111ade9eSPeter Brune VecScatter *gscatter; /* scatter from global space to the subdomain local space */ 14111ade9eSPeter Brune PCASMType type; /* ASM type */ 15111ade9eSPeter Brune PetscBool usesdm; /* use the DM for setting up the subproblems */ 16b20c023fSPeter Brune 17b20c023fSPeter Brune /* logging events */ 18b20c023fSPeter Brune PetscLogEvent eventrestrictinterp; 19b20c023fSPeter Brune PetscLogEvent eventsubsolve; 20eaedb033SPeter Brune } SNES_NASM; 21eaedb033SPeter Brune 22b20c023fSPeter Brune const char *const SNESNASMTypes[] = {"NONE","RESTRICT","INTERPOLATE","BASIC","PCASMType","PC_ASM_",0}; 23b20c023fSPeter Brune 24eaedb033SPeter Brune #undef __FUNCT__ 25eaedb033SPeter Brune #define __FUNCT__ "SNESReset_NASM" 26eaedb033SPeter Brune PetscErrorCode SNESReset_NASM(SNES snes) 27eaedb033SPeter Brune { 28eaedb033SPeter Brune SNES_NASM *nasm = (SNES_NASM*)snes->data; 29eaedb033SPeter Brune PetscErrorCode ierr; 30eaedb033SPeter Brune PetscInt i; 316e111a19SKarl Rupp 32eaedb033SPeter Brune PetscFunctionBegin; 33eaedb033SPeter Brune for (i=0; i<nasm->n; i++) { 34111ade9eSPeter Brune if (nasm->xl) { ierr = VecDestroy(&nasm->xl[i]);CHKERRQ(ierr); } 35f5f7c1b9SKarl Rupp if (nasm->x) { ierr = VecDestroy(&nasm->x[i]);CHKERRQ(ierr); } 36111ade9eSPeter Brune if (nasm->y) { ierr = VecDestroy(&nasm->y[i]);CHKERRQ(ierr); } 37bc8c1f72SJose Roman if (nasm->b) { ierr = VecDestroy(&nasm->b[i]);CHKERRQ(ierr); } 38eaedb033SPeter Brune 39bc8c1f72SJose Roman if (nasm->subsnes) { ierr = SNESDestroy(&nasm->subsnes[i]);CHKERRQ(ierr); } 40111ade9eSPeter Brune if (nasm->oscatter) { ierr = VecScatterDestroy(&nasm->oscatter[i]);CHKERRQ(ierr); } 41111ade9eSPeter Brune if (nasm->iscatter) { ierr = VecScatterDestroy(&nasm->iscatter[i]);CHKERRQ(ierr); } 42111ade9eSPeter Brune if (nasm->gscatter) { ierr = VecScatterDestroy(&nasm->gscatter[i]);CHKERRQ(ierr); } 43eaedb033SPeter Brune } 44111ade9eSPeter Brune 45111ade9eSPeter Brune if (nasm->x) {ierr = PetscFree(nasm->x);CHKERRQ(ierr);} 46111ade9eSPeter Brune if (nasm->xl) {ierr = PetscFree(nasm->xl);CHKERRQ(ierr);} 47111ade9eSPeter Brune if (nasm->y) {ierr = PetscFree(nasm->y);CHKERRQ(ierr);} 48111ade9eSPeter Brune if (nasm->b) {ierr = PetscFree(nasm->b);CHKERRQ(ierr);} 49111ade9eSPeter Brune 50111ade9eSPeter Brune if (nasm->subsnes) {ierr = PetscFree(nasm->subsnes);CHKERRQ(ierr);} 51111ade9eSPeter Brune if (nasm->oscatter) {ierr = PetscFree(nasm->oscatter);CHKERRQ(ierr);} 52111ade9eSPeter Brune if (nasm->iscatter) {ierr = PetscFree(nasm->iscatter);CHKERRQ(ierr);} 53111ade9eSPeter Brune if (nasm->gscatter) {ierr = PetscFree(nasm->gscatter);CHKERRQ(ierr);} 54b20c023fSPeter Brune 55b20c023fSPeter Brune nasm->eventrestrictinterp = 0; 56b20c023fSPeter Brune nasm->eventsubsolve = 0; 57eaedb033SPeter Brune PetscFunctionReturn(0); 58eaedb033SPeter Brune } 59eaedb033SPeter Brune 60eaedb033SPeter Brune #undef __FUNCT__ 61eaedb033SPeter Brune #define __FUNCT__ "SNESDestroy_NASM" 62eaedb033SPeter Brune PetscErrorCode SNESDestroy_NASM(SNES snes) 63eaedb033SPeter Brune { 64eaedb033SPeter Brune PetscErrorCode ierr; 656e111a19SKarl Rupp 66eaedb033SPeter Brune PetscFunctionBegin; 67eaedb033SPeter Brune ierr = SNESReset_NASM(snes);CHKERRQ(ierr); 6822d28d08SBarry Smith ierr = PetscFree(snes->data);CHKERRQ(ierr); 69eaedb033SPeter Brune PetscFunctionReturn(0); 70eaedb033SPeter Brune } 71eaedb033SPeter Brune 72eaedb033SPeter Brune #undef __FUNCT__ 73111ade9eSPeter Brune #define __FUNCT__ "DMGlobalToLocalSubDomainDirichletHook_Private" 740adebc6cSBarry Smith PetscErrorCode DMGlobalToLocalSubDomainDirichletHook_Private(DM dm,Vec g,InsertMode mode,Vec l,void *ctx) 750adebc6cSBarry Smith { 76111ade9eSPeter Brune PetscErrorCode ierr; 77111ade9eSPeter Brune Vec bcs = (Vec)ctx; 786e111a19SKarl Rupp 79111ade9eSPeter Brune PetscFunctionBegin; 80111ade9eSPeter Brune ierr = VecCopy(bcs,l);CHKERRQ(ierr); 81111ade9eSPeter Brune PetscFunctionReturn(0); 82111ade9eSPeter Brune } 83111ade9eSPeter Brune 84111ade9eSPeter Brune #undef __FUNCT__ 85eaedb033SPeter Brune #define __FUNCT__ "SNESSetUp_NASM" 86eaedb033SPeter Brune PetscErrorCode SNESSetUp_NASM(SNES snes) 87eaedb033SPeter Brune { 88eaedb033SPeter Brune SNES_NASM *nasm = (SNES_NASM*)snes->data; 89eaedb033SPeter Brune PetscErrorCode ierr; 900a696f66SPeter Brune DM dm,ddm; 91111ade9eSPeter Brune DM *subdms; 92111ade9eSPeter Brune PetscInt i; 93eaedb033SPeter Brune const char *optionsprefix; 94111ade9eSPeter Brune Vec F; 95eaedb033SPeter Brune 96eaedb033SPeter Brune PetscFunctionBegin; 97eaedb033SPeter Brune if (!nasm->subsnes) { 98eaedb033SPeter Brune ierr = SNESGetDM(snes,&dm);CHKERRQ(ierr); 990a696f66SPeter Brune if (dm) { 100eaedb033SPeter Brune nasm->usesdm = PETSC_TRUE; 1010298fd71SBarry Smith ierr = DMCreateDomainDecomposition(dm,&nasm->n,NULL,NULL,NULL,&subdms);CHKERRQ(ierr); 1020a696f66SPeter Brune if (!subdms) { 1030a696f66SPeter Brune ierr = DMCreateDomainDecompositionDM(dm,"default",&ddm);CHKERRQ(ierr); 104f23aa3ddSBarry Smith if (!ddm) SETERRQ(((PetscObject)dm)->comm,PETSC_ERR_ARG_WRONGSTATE,"DM has no default decomposition defined. Set subsolves manually with SNESNASMSetSubdomains()."); 1050a696f66SPeter Brune ierr = SNESSetDM(snes,ddm);CHKERRQ(ierr); 1060a696f66SPeter Brune ierr = SNESGetDM(snes,&dm);CHKERRQ(ierr); 1070298fd71SBarry Smith ierr = DMCreateDomainDecomposition(dm,&nasm->n,NULL,NULL,NULL,&subdms);CHKERRQ(ierr); 1080a696f66SPeter Brune } 109f23aa3ddSBarry Smith if (!subdms) SETERRQ(((PetscObject)dm)->comm,PETSC_ERR_ARG_WRONGSTATE,"DM has no default decomposition defined. Set subsolves manually with SNESNASMSetSubdomains()."); 110111ade9eSPeter Brune ierr = DMCreateDomainDecompositionScatters(dm,nasm->n,subdms,&nasm->iscatter,&nasm->oscatter,&nasm->gscatter);CHKERRQ(ierr); 111eaedb033SPeter Brune 112eaedb033SPeter Brune ierr = SNESGetOptionsPrefix(snes, &optionsprefix);CHKERRQ(ierr); 113111ade9eSPeter Brune ierr = PetscMalloc(nasm->n*sizeof(SNES),&nasm->subsnes);CHKERRQ(ierr); 114111ade9eSPeter Brune 115111ade9eSPeter Brune for (i=0; i<nasm->n; i++) { 116cdb298fcSPeter Brune ierr = SNESCreate(PETSC_COMM_SELF,&nasm->subsnes[i]);CHKERRQ(ierr); 117cdb298fcSPeter Brune ierr = SNESAppendOptionsPrefix(nasm->subsnes[i],optionsprefix);CHKERRQ(ierr); 118cdb298fcSPeter Brune ierr = SNESAppendOptionsPrefix(nasm->subsnes[i],"sub_");CHKERRQ(ierr); 119cdb298fcSPeter Brune ierr = SNESSetDM(nasm->subsnes[i],subdms[i]);CHKERRQ(ierr); 120cdb298fcSPeter Brune ierr = SNESSetFromOptions(nasm->subsnes[i]);CHKERRQ(ierr); 121111ade9eSPeter Brune ierr = DMDestroy(&subdms[i]);CHKERRQ(ierr); 122111ade9eSPeter Brune } 123111ade9eSPeter Brune ierr = PetscFree(subdms);CHKERRQ(ierr); 124f23aa3ddSBarry Smith } else SETERRQ(((PetscObject)snes)->comm,PETSC_ERR_ARG_WRONGSTATE,"Cannot construct local problems automatically without a DM!"); 125f23aa3ddSBarry Smith } else SETERRQ(((PetscObject)snes)->comm,PETSC_ERR_ARG_WRONGSTATE,"Must set subproblems manually if there is no DM!"); 126111ade9eSPeter Brune /* allocate the global vectors */ 127111ade9eSPeter Brune ierr = PetscMalloc(nasm->n*sizeof(Vec),&nasm->x);CHKERRQ(ierr); 128111ade9eSPeter Brune ierr = PetscMalloc(nasm->n*sizeof(Vec),&nasm->xl);CHKERRQ(ierr); 129111ade9eSPeter Brune ierr = PetscMalloc(nasm->n*sizeof(Vec),&nasm->y);CHKERRQ(ierr); 130111ade9eSPeter Brune ierr = PetscMalloc(nasm->n*sizeof(Vec),&nasm->b);CHKERRQ(ierr); 131111ade9eSPeter Brune 132111ade9eSPeter Brune for (i=0; i<nasm->n; i++) { 133111ade9eSPeter Brune DM subdm; 1340298fd71SBarry Smith ierr = SNESGetFunction(nasm->subsnes[i],&F,NULL,NULL);CHKERRQ(ierr); 135111ade9eSPeter Brune ierr = VecDuplicate(F,&nasm->x[i]);CHKERRQ(ierr); 136111ade9eSPeter Brune ierr = VecDuplicate(F,&nasm->y[i]);CHKERRQ(ierr); 137111ade9eSPeter Brune ierr = VecDuplicate(F,&nasm->b[i]);CHKERRQ(ierr); 138111ade9eSPeter Brune ierr = SNESGetDM(nasm->subsnes[i],&subdm);CHKERRQ(ierr); 139111ade9eSPeter Brune ierr = DMCreateLocalVector(subdm,&nasm->xl[i]);CHKERRQ(ierr); 1400298fd71SBarry Smith ierr = DMGlobalToLocalHookAdd(subdm,DMGlobalToLocalSubDomainDirichletHook_Private,NULL,nasm->xl[i]);CHKERRQ(ierr); 141111ade9eSPeter Brune } 142eaedb033SPeter Brune PetscFunctionReturn(0); 143eaedb033SPeter Brune } 144eaedb033SPeter Brune 145eaedb033SPeter Brune #undef __FUNCT__ 146eaedb033SPeter Brune #define __FUNCT__ "SNESSetFromOptions_NASM" 147eaedb033SPeter Brune PetscErrorCode SNESSetFromOptions_NASM(SNES snes) 148eaedb033SPeter Brune { 149eaedb033SPeter Brune PetscErrorCode ierr; 1500a696f66SPeter Brune DM dm,ddm; 1510a696f66SPeter Brune char ddm_name[1024]; 152111ade9eSPeter Brune PCASMType asmtype; 153b20c023fSPeter Brune PetscBool flg,monflg; 154111ade9eSPeter Brune SNES_NASM *nasm = (SNES_NASM*)snes->data; 1556e111a19SKarl Rupp 156eaedb033SPeter Brune PetscFunctionBegin; 157111ade9eSPeter Brune ierr = PetscOptionsHead("Nonlinear Additive Schwartz options");CHKERRQ(ierr); 158111ade9eSPeter Brune ierr = PetscOptionsEnum("-snes_nasm_type","Type of restriction/extension","",SNESNASMTypes,(PetscEnum)nasm->type,(PetscEnum*)&asmtype,&flg);CHKERRQ(ierr); 1591aa26658SKarl Rupp if (flg) nasm->type = asmtype; 160b20c023fSPeter Brune flg = PETSC_FALSE; 161b20c023fSPeter Brune monflg = PETSC_TRUE; 162b20c023fSPeter Brune ierr = PetscOptionsBool("-snes_nasm_log","Log times for subSNES solves and restriction","",monflg,&monflg,&flg);CHKERRQ(ierr); 163b20c023fSPeter Brune if (flg) { 164b20c023fSPeter Brune ierr = PetscLogEventRegister("SNESNASMSubSolve",((PetscObject)snes)->classid,&nasm->eventsubsolve);CHKERRQ(ierr); 165b20c023fSPeter Brune ierr = PetscLogEventRegister("SNESNASMRestrict",((PetscObject)snes)->classid,&nasm->eventrestrictinterp);CHKERRQ(ierr); 166b20c023fSPeter Brune } 1670a696f66SPeter Brune ierr = PetscOptionsString("-snes_nasm_decomposition", "Name of the DM defining the composition", "SNESSetDM", ddm_name, ddm_name,1024,&flg);CHKERRQ(ierr); 1680a696f66SPeter Brune ierr = SNESGetDM(snes,&dm);CHKERRQ(ierr); 1690a696f66SPeter Brune if (flg) { 1700a696f66SPeter Brune if (dm) { 1710a696f66SPeter Brune ierr = DMCreateDomainDecompositionDM(dm, ddm_name, &ddm);CHKERRQ(ierr); 172f23aa3ddSBarry Smith if (!ddm) SETERRQ1(((PetscObject)snes)->comm, PETSC_ERR_ARG_WRONGSTATE, "Unknown DM decomposition name %s", ddm_name); 1730a696f66SPeter Brune ierr = PetscInfo(snes,"Using domain decomposition DM defined using options database\n");CHKERRQ(ierr); 1740a696f66SPeter Brune ierr = SNESSetDM(snes,ddm);CHKERRQ(ierr); 175f23aa3ddSBarry Smith } else SETERRQ(((PetscObject)snes)->comm, PETSC_ERR_ARG_WRONGSTATE, "No DM to decompose"); 1760a696f66SPeter Brune } 177eaedb033SPeter Brune ierr = PetscOptionsTail();CHKERRQ(ierr); 178eaedb033SPeter Brune PetscFunctionReturn(0); 179eaedb033SPeter Brune } 180eaedb033SPeter Brune 181eaedb033SPeter Brune #undef __FUNCT__ 182eaedb033SPeter Brune #define __FUNCT__ "SNESView_NASM" 183eaedb033SPeter Brune PetscErrorCode SNESView_NASM(SNES snes, PetscViewer viewer) 184eaedb033SPeter Brune { 185eaedb033SPeter Brune PetscFunctionBegin; 186b20c023fSPeter Brune SNES_NASM *nasm = (SNES_NASM*)snes->data; 187b20c023fSPeter Brune PetscErrorCode ierr; 188b20c023fSPeter Brune PetscMPIInt rank; 189b20c023fSPeter Brune PetscInt i,N; 190b20c023fSPeter Brune PetscBool iascii,isstring; 191b20c023fSPeter Brune PetscViewer sviewer; 192b20c023fSPeter Brune MPI_Comm comm = ((PetscObject)snes)->comm; 193b20c023fSPeter Brune 194b20c023fSPeter Brune PetscFunctionBegin; 195b20c023fSPeter Brune ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERASCII,&iascii);CHKERRQ(ierr); 196b20c023fSPeter Brune ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERSTRING,&isstring);CHKERRQ(ierr); 197b20c023fSPeter Brune ierr = MPI_Comm_rank(comm,&rank);CHKERRQ(ierr); 198b20c023fSPeter Brune ierr = MPI_Reduce(&nasm->n,&N,1,MPIU_INT,MPIU_SUM,0,comm);CHKERRQ(ierr); 199b20c023fSPeter Brune if (iascii) { 200b20c023fSPeter Brune ierr = PetscViewerASCIIPrintf(viewer, " Nonlinear Additive Schwarz: total subdomain blocks = %D\n",N);CHKERRQ(ierr); 201b20c023fSPeter Brune ierr = PetscViewerASCIIPrintf(viewer," Nonlinear Additive Schwarz: restriction/interpolation type - %s\n",SNESNASMTypes[nasm->type]);CHKERRQ(ierr); 202b20c023fSPeter Brune ierr = PetscViewerASCIIPrintf(viewer," Nonlinear Additive Schwarz: subSNES iterations: %D subKSP iterations: %D\n",SNESNASMTypes[nasm->type]);CHKERRQ(ierr); 203b20c023fSPeter Brune ierr = PetscViewerASCIISynchronizedAllow(viewer,PETSC_TRUE);CHKERRQ(ierr); 204b20c023fSPeter Brune ierr = PetscViewerASCIISynchronizedPrintf(viewer," [%d] number of local blocks = %D\n",(int)rank,nasm->n);CHKERRQ(ierr); 205b20c023fSPeter Brune ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 206b20c023fSPeter Brune ierr = PetscViewerASCIIPrintf(viewer," Local SNES objects:\n");CHKERRQ(ierr); 207b20c023fSPeter Brune ierr = PetscViewerASCIIPushTab(viewer);CHKERRQ(ierr); 208b20c023fSPeter Brune if (!rank) { 209b20c023fSPeter Brune for (i=0; i<nasm->n; i++) { 210b20c023fSPeter Brune ierr = PetscViewerGetSingleton(viewer,&sviewer);CHKERRQ(ierr); 211b20c023fSPeter Brune ierr = SNESView(nasm->subsnes[i],sviewer);CHKERRQ(ierr); 212b20c023fSPeter Brune ierr = PetscViewerRestoreSingleton(viewer,&sviewer);CHKERRQ(ierr); 213b20c023fSPeter Brune } 214b20c023fSPeter Brune } 215b20c023fSPeter Brune ierr = PetscViewerASCIIPopTab(viewer);CHKERRQ(ierr); 216b20c023fSPeter Brune ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 217b20c023fSPeter Brune ierr = PetscViewerASCIISynchronizedAllow(viewer,PETSC_FALSE);CHKERRQ(ierr); 218b20c023fSPeter Brune } else if (isstring) { 219b20c023fSPeter Brune ierr = PetscViewerStringSPrintf(viewer," blocks=%D,type=%s",N,SNESNASMTypes[nasm->type]);CHKERRQ(ierr); 220b20c023fSPeter Brune ierr = PetscViewerGetSingleton(viewer,&sviewer);CHKERRQ(ierr); 221b20c023fSPeter Brune if (nasm->subsnes && !rank) {ierr = SNESView(nasm->subsnes[0],sviewer);CHKERRQ(ierr);} 222b20c023fSPeter Brune ierr = PetscViewerRestoreSingleton(viewer,&sviewer);CHKERRQ(ierr); 223b20c023fSPeter Brune } 224eaedb033SPeter Brune PetscFunctionReturn(0); 225eaedb033SPeter Brune } 226eaedb033SPeter Brune 227eaedb033SPeter Brune #undef __FUNCT__ 228eaedb033SPeter Brune #define __FUNCT__ "SNESNASMSetSubdomains" 229a6dfd86eSKarl Rupp PetscErrorCode SNESNASMSetSubdomains(SNES snes,PetscInt n,SNES subsnes[],VecScatter iscatter[],VecScatter oscatter[],VecScatter gscatter[]) 230a6dfd86eSKarl Rupp { 231eaedb033SPeter Brune PetscErrorCode ierr; 232111ade9eSPeter Brune PetscErrorCode (*f)(SNES,PetscInt,SNES*,VecScatter*,VecScatter*,VecScatter*); 2336e111a19SKarl Rupp 234eaedb033SPeter Brune PetscFunctionBegin; 235eaedb033SPeter Brune ierr = PetscObjectQueryFunction((PetscObject)snes,"SNESNASMSetSubdomains_C",(void (**)(void))&f);CHKERRQ(ierr); 236111ade9eSPeter Brune ierr = (f)(snes,n,subsnes,iscatter,oscatter,gscatter);CHKERRQ(ierr); 237eaedb033SPeter Brune PetscFunctionReturn(0); 238eaedb033SPeter Brune } 239eaedb033SPeter Brune 240eaedb033SPeter Brune EXTERN_C_BEGIN 241eaedb033SPeter Brune #undef __FUNCT__ 242eaedb033SPeter Brune #define __FUNCT__ "SNESNASMSetSubdomains_NASM" 243a6dfd86eSKarl Rupp PetscErrorCode SNESNASMSetSubdomains_NASM(SNES snes,PetscInt n,SNES subsnes[],VecScatter iscatter[],VecScatter oscatter[],VecScatter gscatter[]) 244a6dfd86eSKarl Rupp { 245eaedb033SPeter Brune PetscInt i; 246eaedb033SPeter Brune PetscErrorCode ierr; 247eaedb033SPeter Brune SNES_NASM *nasm = (SNES_NASM*)snes->data; 2486e111a19SKarl Rupp 249eaedb033SPeter Brune PetscFunctionBegin; 250eaedb033SPeter Brune if (snes->setupcalled) SETERRQ(((PetscObject)snes)->comm,PETSC_ERR_ARG_WRONGSTATE,"SNESNASMSetSubdomains() should be called before calling SNESSetUp()."); 251eaedb033SPeter Brune 252111ade9eSPeter Brune /* tear down the previously set things */ 253111ade9eSPeter Brune ierr = SNESReset(snes);CHKERRQ(ierr); 254111ade9eSPeter Brune 255eaedb033SPeter Brune nasm->n = n; 256111ade9eSPeter Brune if (oscatter) { 257111ade9eSPeter Brune for (i=0; i<n; i++) {ierr = PetscObjectReference((PetscObject)oscatter[i]);CHKERRQ(ierr);} 258eaedb033SPeter Brune } 259111ade9eSPeter Brune if (iscatter) { 260111ade9eSPeter Brune for (i=0; i<n; i++) {ierr = PetscObjectReference((PetscObject)iscatter[i]);CHKERRQ(ierr);} 261eaedb033SPeter Brune } 262111ade9eSPeter Brune if (gscatter) { 263111ade9eSPeter Brune for (i=0; i<n; i++) {ierr = PetscObjectReference((PetscObject)gscatter[i]);CHKERRQ(ierr);} 264111ade9eSPeter Brune } 265111ade9eSPeter Brune if (oscatter) { 266111ade9eSPeter Brune ierr = PetscMalloc(n*sizeof(IS),&nasm->oscatter);CHKERRQ(ierr); 267eaedb033SPeter Brune for (i=0; i<n; i++) { 268111ade9eSPeter Brune nasm->oscatter[i] = oscatter[i]; 269eaedb033SPeter Brune } 270111ade9eSPeter Brune } 271111ade9eSPeter Brune if (iscatter) { 272111ade9eSPeter Brune ierr = PetscMalloc(n*sizeof(IS),&nasm->iscatter);CHKERRQ(ierr); 273eaedb033SPeter Brune for (i=0; i<n; i++) { 274111ade9eSPeter Brune nasm->iscatter[i] = iscatter[i]; 275eaedb033SPeter Brune } 276eaedb033SPeter Brune } 277111ade9eSPeter Brune if (gscatter) { 278111ade9eSPeter Brune ierr = PetscMalloc(n*sizeof(IS),&nasm->gscatter);CHKERRQ(ierr); 279eaedb033SPeter Brune for (i=0; i<n; i++) { 280111ade9eSPeter Brune nasm->gscatter[i] = gscatter[i]; 281eaedb033SPeter Brune } 282eaedb033SPeter Brune } 283111ade9eSPeter Brune 284eaedb033SPeter Brune if (subsnes) { 285eaedb033SPeter Brune ierr = PetscMalloc(n*sizeof(SNES),&nasm->subsnes);CHKERRQ(ierr); 286eaedb033SPeter Brune for (i=0; i<n; i++) { 287eaedb033SPeter Brune nasm->subsnes[i] = subsnes[i]; 288eaedb033SPeter Brune } 289eaedb033SPeter Brune } 290eaedb033SPeter Brune PetscFunctionReturn(0); 291eaedb033SPeter Brune } 292eaedb033SPeter Brune EXTERN_C_END 293eaedb033SPeter Brune 294eaedb033SPeter Brune #undef __FUNCT__ 295eaedb033SPeter Brune #define __FUNCT__ "SNESNASMSolveLocal_Private" 2960adebc6cSBarry Smith PetscErrorCode SNESNASMSolveLocal_Private(SNES snes,Vec B,Vec Y,Vec X) 2970adebc6cSBarry Smith { 298eaedb033SPeter Brune SNES_NASM *nasm = (SNES_NASM*)snes->data; 299258e1594SPeter Brune SNES subsnes; 300eaedb033SPeter Brune PetscInt i; 301eaedb033SPeter Brune PetscErrorCode ierr; 302111ade9eSPeter Brune Vec Xlloc,Xl,Bl,Yl; 303111ade9eSPeter Brune VecScatter iscat,oscat,gscat; 304111ade9eSPeter Brune DM dm,subdm; 3050adebc6cSBarry Smith 306eaedb033SPeter Brune PetscFunctionBegin; 307eaedb033SPeter Brune ierr = SNESGetDM(snes,&dm);CHKERRQ(ierr); 308111ade9eSPeter Brune ierr = VecSet(Y,0);CHKERRQ(ierr); 309b20c023fSPeter Brune 310b20c023fSPeter Brune if (nasm->eventrestrictinterp) {ierr = PetscLogEventBegin(nasm->eventrestrictinterp,snes,0,0,0);CHKERRQ(ierr);} 311eaedb033SPeter Brune for (i=0; i<nasm->n; i++) { 31270c78f05SPeter Brune /* scatter the solution to the local solution */ 31370c78f05SPeter Brune Xlloc = nasm->xl[i]; 31470c78f05SPeter Brune gscat = nasm->gscatter[i]; 31570c78f05SPeter Brune oscat = nasm->oscatter[i]; 31670c78f05SPeter Brune ierr = VecScatterBegin(gscat,X,Xlloc,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 31770c78f05SPeter Brune if (B) { 31870c78f05SPeter Brune /* scatter the RHS to the local RHS */ 31970c78f05SPeter Brune Bl = nasm->b[i]; 32070c78f05SPeter Brune ierr = VecScatterBegin(oscat,B,Bl,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 32170c78f05SPeter Brune } else { 3220298fd71SBarry Smith Bl = NULL; 32370c78f05SPeter Brune } 32470c78f05SPeter Brune } 325b20c023fSPeter Brune if (nasm->eventrestrictinterp) {ierr = PetscLogEventEnd(nasm->eventrestrictinterp,snes,0,0,0);CHKERRQ(ierr);} 326b20c023fSPeter Brune 32770c78f05SPeter Brune for (i=0; i<nasm->n; i++) { 32870c78f05SPeter Brune Xlloc = nasm->xl[i]; 32970c78f05SPeter Brune ierr = VecScatterEnd(gscat,X,Xlloc,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 33070c78f05SPeter Brune if (B) { 33170c78f05SPeter Brune ierr = VecScatterEnd(oscat,B,Bl,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 33270c78f05SPeter Brune } 33370c78f05SPeter Brune } 334b20c023fSPeter Brune 335b20c023fSPeter Brune if (nasm->eventsubsolve) {ierr = PetscLogEventBegin(nasm->eventsubsolve,snes,0,0,0);CHKERRQ(ierr);} 33670c78f05SPeter Brune for (i=0; i<nasm->n; i++) { 33770c78f05SPeter Brune Xl = nasm->x[i]; 33870c78f05SPeter Brune Xlloc = nasm->xl[i]; 33970c78f05SPeter Brune Yl = nasm->y[i]; 340258e1594SPeter Brune subsnes = nasm->subsnes[i]; 341258e1594SPeter Brune ierr = SNESGetDM(subsnes,&subdm);CHKERRQ(ierr); 342111ade9eSPeter Brune iscat = nasm->iscatter[i]; 343111ade9eSPeter Brune oscat = nasm->oscatter[i]; 344111ade9eSPeter Brune gscat = nasm->gscatter[i]; 345111ade9eSPeter Brune ierr = DMSubDomainRestrict(dm,oscat,gscat,subdm);CHKERRQ(ierr); 346111ade9eSPeter Brune 34770c78f05SPeter Brune ierr = DMLocalToGlobalBegin(subdm,Xlloc,INSERT_VALUES,Xl);CHKERRQ(ierr); 34870c78f05SPeter Brune ierr = DMLocalToGlobalEnd(subdm,Xlloc,INSERT_VALUES,Xl);CHKERRQ(ierr); 349111ade9eSPeter Brune ierr = VecCopy(Xl,Yl);CHKERRQ(ierr); 350258e1594SPeter Brune ierr = SNESSolve(subsnes,Bl,Yl);CHKERRQ(ierr); 351111ade9eSPeter Brune ierr = VecAXPY(Yl,-1.0,Xl);CHKERRQ(ierr); 35270c78f05SPeter Brune } 353b20c023fSPeter Brune if (nasm->eventsubsolve) {ierr = PetscLogEventEnd(nasm->eventsubsolve,snes,0,0,0);CHKERRQ(ierr);} 354111ade9eSPeter Brune 35570c78f05SPeter Brune ierr = MPI_Barrier(((PetscObject)snes)->comm);CHKERRQ(ierr); 35670c78f05SPeter Brune 357b20c023fSPeter Brune if (nasm->eventrestrictinterp) {ierr = PetscLogEventBegin(nasm->eventrestrictinterp,snes,0,0,0);CHKERRQ(ierr);} 35870c78f05SPeter Brune for (i=0; i<nasm->n; i++) { 35970c78f05SPeter Brune Yl = nasm->y[i]; 36070c78f05SPeter Brune iscat = nasm->iscatter[i]; 36170c78f05SPeter Brune oscat = nasm->oscatter[i]; 362111ade9eSPeter Brune if (nasm->type == PC_ASM_BASIC) { 363111ade9eSPeter Brune ierr = VecScatterBegin(oscat,Yl,Y,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 364111ade9eSPeter Brune } else if (nasm->type == PC_ASM_RESTRICT) { 365111ade9eSPeter Brune ierr = VecScatterBegin(iscat,Yl,Y,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 366b20c023fSPeter Brune } else SETERRQ(((PetscObject)snes)->comm,PETSC_ERR_ARG_WRONGSTATE,"Only basic and restrict types are supported for SNESNASM"); 367eaedb033SPeter Brune } 368eaedb033SPeter Brune 36970c78f05SPeter Brune for (i=0; i<nasm->n; i++) { 37070c78f05SPeter Brune Yl = nasm->y[i]; 37170c78f05SPeter Brune iscat = nasm->iscatter[i]; 37270c78f05SPeter Brune oscat = nasm->oscatter[i]; 37370c78f05SPeter Brune if (nasm->type == PC_ASM_BASIC) { 37470c78f05SPeter Brune ierr = VecScatterEnd(oscat,Yl,Y,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 37570c78f05SPeter Brune } else if (nasm->type == PC_ASM_RESTRICT) { 37670c78f05SPeter Brune ierr = VecScatterEnd(iscat,Yl,Y,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 377b20c023fSPeter Brune } else SETERRQ(((PetscObject)snes)->comm,PETSC_ERR_ARG_WRONGSTATE,"Only basic and restrict types are supported for SNESNASM"); 37870c78f05SPeter Brune } 379b20c023fSPeter Brune if (nasm->eventrestrictinterp) {ierr = PetscLogEventEnd(nasm->eventrestrictinterp,snes,0,0,0);CHKERRQ(ierr);} 38070c78f05SPeter Brune 38170c78f05SPeter Brune ierr = MPI_Barrier(((PetscObject)snes)->comm);CHKERRQ(ierr); 382cd939e56SPeter Brune 383111ade9eSPeter Brune ierr = VecAXPY(X,1.0,Y);CHKERRQ(ierr); 384eaedb033SPeter Brune PetscFunctionReturn(0); 385eaedb033SPeter Brune } 386eaedb033SPeter Brune 387eaedb033SPeter Brune #undef __FUNCT__ 388eaedb033SPeter Brune #define __FUNCT__ "SNESSolve_NASM" 389eaedb033SPeter Brune PetscErrorCode SNESSolve_NASM(SNES snes) 390eaedb033SPeter Brune { 391eaedb033SPeter Brune Vec F; 392eaedb033SPeter Brune Vec X; 393eaedb033SPeter Brune Vec B; 394111ade9eSPeter Brune Vec Y; 395eaedb033SPeter Brune PetscInt i; 396eaedb033SPeter Brune PetscReal fnorm; 397eaedb033SPeter Brune PetscErrorCode ierr; 398eaedb033SPeter Brune SNESNormType normtype; 399eaedb033SPeter Brune 400eaedb033SPeter Brune PetscFunctionBegin; 401eaedb033SPeter Brune X = snes->vec_sol; 402111ade9eSPeter Brune Y = snes->vec_sol_update; 403eaedb033SPeter Brune F = snes->vec_func; 404eaedb033SPeter Brune B = snes->vec_rhs; 405eaedb033SPeter Brune 406eaedb033SPeter Brune ierr = PetscObjectTakeAccess(snes);CHKERRQ(ierr); 407eaedb033SPeter Brune snes->iter = 0; 408eaedb033SPeter Brune snes->norm = 0.; 409eaedb033SPeter Brune ierr = PetscObjectGrantAccess(snes);CHKERRQ(ierr); 410eaedb033SPeter Brune snes->reason = SNES_CONVERGED_ITERATING; 411eaedb033SPeter Brune ierr = SNESGetNormType(snes, &normtype);CHKERRQ(ierr); 412eaedb033SPeter Brune if (normtype == SNES_NORM_FUNCTION || normtype == SNES_NORM_INITIAL_ONLY || normtype == SNES_NORM_INITIAL_FINAL_ONLY) { 413eaedb033SPeter Brune /* compute the initial function and preconditioned update delX */ 414eaedb033SPeter Brune if (!snes->vec_func_init_set) { 415eaedb033SPeter Brune ierr = SNESComputeFunction(snes,X,F);CHKERRQ(ierr); 416eaedb033SPeter Brune if (snes->domainerror) { 417eaedb033SPeter Brune snes->reason = SNES_DIVERGED_FUNCTION_DOMAIN; 418eaedb033SPeter Brune PetscFunctionReturn(0); 419eaedb033SPeter Brune } 4201aa26658SKarl Rupp } else snes->vec_func_init_set = PETSC_FALSE; 421eaedb033SPeter Brune 422eaedb033SPeter Brune /* convergence test */ 423eaedb033SPeter Brune if (!snes->norm_init_set) { 424eaedb033SPeter Brune ierr = VecNorm(F, NORM_2, &fnorm);CHKERRQ(ierr); /* fnorm <- ||F|| */ 425eaedb033SPeter Brune if (PetscIsInfOrNanReal(fnorm)) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_FP,"Infinite or not-a-number generated in norm"); 426eaedb033SPeter Brune } else { 427eaedb033SPeter Brune fnorm = snes->norm_init; 428eaedb033SPeter Brune snes->norm_init_set = PETSC_FALSE; 429eaedb033SPeter Brune } 430eaedb033SPeter Brune ierr = PetscObjectTakeAccess(snes);CHKERRQ(ierr); 431eaedb033SPeter Brune snes->iter = 0; 432eaedb033SPeter Brune snes->norm = fnorm; 433eaedb033SPeter Brune ierr = PetscObjectGrantAccess(snes);CHKERRQ(ierr); 434*a71f0d7dSBarry Smith ierr = SNESLogConvergenceHistory(snes,snes->norm,0);CHKERRQ(ierr); 435eaedb033SPeter Brune ierr = SNESMonitor(snes,0,snes->norm);CHKERRQ(ierr); 436eaedb033SPeter Brune 437eaedb033SPeter Brune /* set parameter for default relative tolerance convergence test */ 438eaedb033SPeter Brune snes->ttol = fnorm*snes->rtol; 439eaedb033SPeter Brune 440eaedb033SPeter Brune /* test convergence */ 441eaedb033SPeter Brune ierr = (*snes->ops->converged)(snes,0,0.0,0.0,fnorm,&snes->reason,snes->cnvP);CHKERRQ(ierr); 442eaedb033SPeter Brune if (snes->reason) PetscFunctionReturn(0); 443eaedb033SPeter Brune } else { 444eaedb033SPeter Brune ierr = PetscObjectGrantAccess(snes);CHKERRQ(ierr); 445*a71f0d7dSBarry Smith ierr = SNESLogConvergenceHistory(snes,snes->norm,0);CHKERRQ(ierr); 446eaedb033SPeter Brune ierr = SNESMonitor(snes,0,snes->norm);CHKERRQ(ierr); 447eaedb033SPeter Brune } 448eaedb033SPeter Brune 449eaedb033SPeter Brune /* Call general purpose update function */ 450eaedb033SPeter Brune if (snes->ops->update) { 451eaedb033SPeter Brune ierr = (*snes->ops->update)(snes, snes->iter);CHKERRQ(ierr); 452eaedb033SPeter Brune } 453eaedb033SPeter Brune 454eaedb033SPeter Brune for (i = 0; i < snes->max_its; i++) { 455111ade9eSPeter Brune ierr = SNESNASMSolveLocal_Private(snes,B,Y,X);CHKERRQ(ierr); 456eaedb033SPeter Brune if (normtype == SNES_NORM_FUNCTION || ((i == snes->max_its - 1) && (normtype == SNES_NORM_INITIAL_FINAL_ONLY || normtype == SNES_NORM_FINAL_ONLY))) { 457eaedb033SPeter Brune ierr = SNESComputeFunction(snes,X,F);CHKERRQ(ierr); 458eaedb033SPeter Brune if (snes->domainerror) { 459eaedb033SPeter Brune snes->reason = SNES_DIVERGED_FUNCTION_DOMAIN; 460eaedb033SPeter Brune PetscFunctionReturn(0); 461eaedb033SPeter Brune } 462eaedb033SPeter Brune ierr = VecNorm(F, NORM_2, &fnorm);CHKERRQ(ierr); /* fnorm <- ||F|| */ 463eaedb033SPeter Brune if (PetscIsInfOrNanReal(fnorm)) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_FP,"Infinite or not-a-number generated in norm"); 464eaedb033SPeter Brune } 465eaedb033SPeter Brune /* Monitor convergence */ 466eaedb033SPeter Brune ierr = PetscObjectTakeAccess(snes);CHKERRQ(ierr); 467eaedb033SPeter Brune snes->iter = i+1; 468eaedb033SPeter Brune snes->norm = fnorm; 469eaedb033SPeter Brune ierr = PetscObjectGrantAccess(snes);CHKERRQ(ierr); 470*a71f0d7dSBarry Smith ierr = SNESLogConvergenceHistory(snes,snes->norm,0);CHKERRQ(ierr); 471eaedb033SPeter Brune ierr = SNESMonitor(snes,snes->iter,snes->norm);CHKERRQ(ierr); 472eaedb033SPeter Brune /* Test for convergence */ 473eaedb033SPeter Brune if (normtype == SNES_NORM_FUNCTION) ierr = (*snes->ops->converged)(snes,snes->iter,0.0,0.0,fnorm,&snes->reason,snes->cnvP);CHKERRQ(ierr); 474eaedb033SPeter Brune if (snes->reason) PetscFunctionReturn(0); 475eaedb033SPeter Brune /* Call general purpose update function */ 476eaedb033SPeter Brune if (snes->ops->update) { 477eaedb033SPeter Brune ierr = (*snes->ops->update)(snes, snes->iter);CHKERRQ(ierr); 478eaedb033SPeter Brune } 479eaedb033SPeter Brune } 480eaedb033SPeter Brune if (normtype == SNES_NORM_FUNCTION) { 481eaedb033SPeter Brune if (i == snes->max_its) { 482eaedb033SPeter Brune ierr = PetscInfo1(snes,"Maximum number of iterations has been reached: %D\n",snes->max_its);CHKERRQ(ierr); 483eaedb033SPeter Brune if (!snes->reason) snes->reason = SNES_DIVERGED_MAX_IT; 484eaedb033SPeter Brune } 4851aa26658SKarl Rupp } else if (!snes->reason) snes->reason = SNES_CONVERGED_ITS; /* NASM is meant to be used as a preconditioner */ 486eaedb033SPeter Brune PetscFunctionReturn(0); 487eaedb033SPeter Brune } 488eaedb033SPeter Brune 489eaedb033SPeter Brune /*MC 490eaedb033SPeter Brune SNESNASM - Nonlinear Additive Schwartz 491eaedb033SPeter Brune 492eaedb033SPeter Brune Level: advanced 493eaedb033SPeter Brune 494eaedb033SPeter Brune .seealso: SNESCreate(), SNES, SNESSetType(), SNESType (for list of available types) 495eaedb033SPeter Brune M*/ 496eaedb033SPeter Brune 497eaedb033SPeter Brune EXTERN_C_BEGIN 498eaedb033SPeter Brune #undef __FUNCT__ 499eaedb033SPeter Brune #define __FUNCT__ "SNESCreate_NASM" 500eaedb033SPeter Brune PetscErrorCode SNESCreate_NASM(SNES snes) 501eaedb033SPeter Brune { 502eaedb033SPeter Brune SNES_NASM *nasm; 503eaedb033SPeter Brune PetscErrorCode ierr; 504eaedb033SPeter Brune 505eaedb033SPeter Brune PetscFunctionBegin; 506eaedb033SPeter Brune ierr = PetscNewLog(snes, SNES_NASM, &nasm);CHKERRQ(ierr); 507eaedb033SPeter Brune snes->data = (void*)nasm; 508eaedb033SPeter Brune 509eaedb033SPeter Brune nasm->n = PETSC_DECIDE; 510eaedb033SPeter Brune nasm->subsnes = 0; 511eaedb033SPeter Brune nasm->x = 0; 512111ade9eSPeter Brune nasm->xl = 0; 513111ade9eSPeter Brune nasm->y = 0; 514eaedb033SPeter Brune nasm->b = 0; 515111ade9eSPeter Brune nasm->oscatter = 0; 516111ade9eSPeter Brune nasm->iscatter = 0; 517111ade9eSPeter Brune nasm->gscatter = 0; 518111ade9eSPeter Brune 519111ade9eSPeter Brune nasm->type = PC_ASM_BASIC; 520eaedb033SPeter Brune 521eaedb033SPeter Brune snes->ops->destroy = SNESDestroy_NASM; 522eaedb033SPeter Brune snes->ops->setup = SNESSetUp_NASM; 523eaedb033SPeter Brune snes->ops->setfromoptions = SNESSetFromOptions_NASM; 524eaedb033SPeter Brune snes->ops->view = SNESView_NASM; 525eaedb033SPeter Brune snes->ops->solve = SNESSolve_NASM; 526eaedb033SPeter Brune snes->ops->reset = SNESReset_NASM; 527eaedb033SPeter Brune 528eaedb033SPeter Brune snes->usesksp = PETSC_FALSE; 529eaedb033SPeter Brune snes->usespc = PETSC_FALSE; 530eaedb033SPeter Brune 5310298fd71SBarry Smith nasm->eventrestrictinterp = 0; 5320298fd71SBarry Smith nasm->eventsubsolve = 0; 533b20c023fSPeter Brune 534eaedb033SPeter Brune if (!snes->tolerancesset) { 535eaedb033SPeter Brune snes->max_its = 10000; 536eaedb033SPeter Brune snes->max_funcs = 10000; 537eaedb033SPeter Brune } 538eaedb033SPeter Brune 539eaedb033SPeter Brune ierr = PetscObjectComposeFunctionDynamic((PetscObject)snes,"SNESNASMSetSubdomains_C","SNESNASMSetSubdomains_NASM", 540eaedb033SPeter Brune SNESNASMSetSubdomains_NASM);CHKERRQ(ierr); 541eaedb033SPeter Brune PetscFunctionReturn(0); 542eaedb033SPeter Brune } 543eaedb033SPeter Brune EXTERN_C_END 544