1eaedb033SPeter Brune #include <petsc-private/snesimpl.h> /*I "petscsnes.h" I*/ 2111ade9eSPeter Brune #include <petscdm.h> 3eaedb033SPeter Brune 4eaedb033SPeter Brune typedef struct { 5eaedb033SPeter Brune PetscInt n; /* local subdomains */ 6eaedb033SPeter Brune SNES *subsnes; /* nonlinear solvers for each subdomain */ 7eaedb033SPeter Brune Vec *x; /* solution vectors */ 8111ade9eSPeter Brune Vec *xl; /* solution local vectors */ 9111ade9eSPeter Brune Vec *y; /* step vectors */ 10eaedb033SPeter Brune Vec *b; /* rhs vectors */ 11111ade9eSPeter Brune VecScatter *oscatter; /* scatter from global space to the subdomain global space */ 12111ade9eSPeter Brune VecScatter *iscatter; /* scatter from global space to the nonoverlapping subdomain space */ 13111ade9eSPeter Brune VecScatter *gscatter; /* scatter from global space to the subdomain local space */ 14111ade9eSPeter Brune PCASMType type; /* ASM type */ 15111ade9eSPeter Brune PetscBool usesdm; /* use the DM for setting up the subproblems */ 16*d728fb7dSPeter Brune PetscBool finaljacobian; /* compute the jacobian of the converged solution */ 17b20c023fSPeter Brune 18b20c023fSPeter Brune /* logging events */ 19b20c023fSPeter Brune PetscLogEvent eventrestrictinterp; 20b20c023fSPeter Brune PetscLogEvent eventsubsolve; 21eaedb033SPeter Brune } SNES_NASM; 22eaedb033SPeter Brune 23b20c023fSPeter Brune const char *const SNESNASMTypes[] = {"NONE","RESTRICT","INTERPOLATE","BASIC","PCASMType","PC_ASM_",0}; 24b20c023fSPeter Brune 25eaedb033SPeter Brune #undef __FUNCT__ 26eaedb033SPeter Brune #define __FUNCT__ "SNESReset_NASM" 27eaedb033SPeter Brune PetscErrorCode SNESReset_NASM(SNES snes) 28eaedb033SPeter Brune { 29eaedb033SPeter Brune SNES_NASM *nasm = (SNES_NASM*)snes->data; 30eaedb033SPeter Brune PetscErrorCode ierr; 31eaedb033SPeter Brune PetscInt i; 326e111a19SKarl Rupp 33eaedb033SPeter Brune PetscFunctionBegin; 34eaedb033SPeter Brune for (i=0; i<nasm->n; i++) { 35111ade9eSPeter Brune if (nasm->xl) { ierr = VecDestroy(&nasm->xl[i]);CHKERRQ(ierr); } 36f5f7c1b9SKarl Rupp if (nasm->x) { ierr = VecDestroy(&nasm->x[i]);CHKERRQ(ierr); } 37111ade9eSPeter Brune if (nasm->y) { ierr = VecDestroy(&nasm->y[i]);CHKERRQ(ierr); } 38bc8c1f72SJose Roman if (nasm->b) { ierr = VecDestroy(&nasm->b[i]);CHKERRQ(ierr); } 39eaedb033SPeter Brune 40bc8c1f72SJose Roman if (nasm->subsnes) { ierr = SNESDestroy(&nasm->subsnes[i]);CHKERRQ(ierr); } 41111ade9eSPeter Brune if (nasm->oscatter) { ierr = VecScatterDestroy(&nasm->oscatter[i]);CHKERRQ(ierr); } 42111ade9eSPeter Brune if (nasm->iscatter) { ierr = VecScatterDestroy(&nasm->iscatter[i]);CHKERRQ(ierr); } 43111ade9eSPeter Brune if (nasm->gscatter) { ierr = VecScatterDestroy(&nasm->gscatter[i]);CHKERRQ(ierr); } 44eaedb033SPeter Brune } 45111ade9eSPeter Brune 46111ade9eSPeter Brune if (nasm->x) {ierr = PetscFree(nasm->x);CHKERRQ(ierr);} 47111ade9eSPeter Brune if (nasm->xl) {ierr = PetscFree(nasm->xl);CHKERRQ(ierr);} 48111ade9eSPeter Brune if (nasm->y) {ierr = PetscFree(nasm->y);CHKERRQ(ierr);} 49111ade9eSPeter Brune if (nasm->b) {ierr = PetscFree(nasm->b);CHKERRQ(ierr);} 50111ade9eSPeter Brune 51111ade9eSPeter Brune if (nasm->subsnes) {ierr = PetscFree(nasm->subsnes);CHKERRQ(ierr);} 52111ade9eSPeter Brune if (nasm->oscatter) {ierr = PetscFree(nasm->oscatter);CHKERRQ(ierr);} 53111ade9eSPeter Brune if (nasm->iscatter) {ierr = PetscFree(nasm->iscatter);CHKERRQ(ierr);} 54111ade9eSPeter Brune if (nasm->gscatter) {ierr = PetscFree(nasm->gscatter);CHKERRQ(ierr);} 55b20c023fSPeter Brune 56b20c023fSPeter Brune nasm->eventrestrictinterp = 0; 57b20c023fSPeter Brune nasm->eventsubsolve = 0; 58eaedb033SPeter Brune PetscFunctionReturn(0); 59eaedb033SPeter Brune } 60eaedb033SPeter Brune 61eaedb033SPeter Brune #undef __FUNCT__ 62eaedb033SPeter Brune #define __FUNCT__ "SNESDestroy_NASM" 63eaedb033SPeter Brune PetscErrorCode SNESDestroy_NASM(SNES snes) 64eaedb033SPeter Brune { 65eaedb033SPeter Brune PetscErrorCode ierr; 666e111a19SKarl Rupp 67eaedb033SPeter Brune PetscFunctionBegin; 68eaedb033SPeter Brune ierr = SNESReset_NASM(snes);CHKERRQ(ierr); 6922d28d08SBarry Smith ierr = PetscFree(snes->data);CHKERRQ(ierr); 70eaedb033SPeter Brune PetscFunctionReturn(0); 71eaedb033SPeter Brune } 72eaedb033SPeter Brune 73eaedb033SPeter Brune #undef __FUNCT__ 74111ade9eSPeter Brune #define __FUNCT__ "DMGlobalToLocalSubDomainDirichletHook_Private" 750adebc6cSBarry Smith PetscErrorCode DMGlobalToLocalSubDomainDirichletHook_Private(DM dm,Vec g,InsertMode mode,Vec l,void *ctx) 760adebc6cSBarry Smith { 77111ade9eSPeter Brune PetscErrorCode ierr; 78111ade9eSPeter Brune Vec bcs = (Vec)ctx; 796e111a19SKarl Rupp 80111ade9eSPeter Brune PetscFunctionBegin; 81111ade9eSPeter Brune ierr = VecCopy(bcs,l);CHKERRQ(ierr); 82111ade9eSPeter Brune PetscFunctionReturn(0); 83111ade9eSPeter Brune } 84111ade9eSPeter Brune 85111ade9eSPeter Brune #undef __FUNCT__ 86eaedb033SPeter Brune #define __FUNCT__ "SNESSetUp_NASM" 87eaedb033SPeter Brune PetscErrorCode SNESSetUp_NASM(SNES snes) 88eaedb033SPeter Brune { 89eaedb033SPeter Brune SNES_NASM *nasm = (SNES_NASM*)snes->data; 90eaedb033SPeter Brune PetscErrorCode ierr; 9176857b2aSPeter Brune DM dm,subdm; 92111ade9eSPeter Brune DM *subdms; 93111ade9eSPeter Brune PetscInt i; 94eaedb033SPeter Brune const char *optionsprefix; 95111ade9eSPeter Brune Vec F; 96eaedb033SPeter Brune 97eaedb033SPeter Brune PetscFunctionBegin; 98eaedb033SPeter Brune if (!nasm->subsnes) { 99eaedb033SPeter Brune ierr = SNESGetDM(snes,&dm);CHKERRQ(ierr); 1000a696f66SPeter Brune if (dm) { 101eaedb033SPeter Brune nasm->usesdm = PETSC_TRUE; 1020298fd71SBarry Smith ierr = DMCreateDomainDecomposition(dm,&nasm->n,NULL,NULL,NULL,&subdms);CHKERRQ(ierr); 103ce94432eSBarry Smith if (!subdms) SETERRQ(PetscObjectComm((PetscObject)dm),PETSC_ERR_ARG_WRONGSTATE,"DM has no default decomposition defined. Set subsolves manually with SNESNASMSetSubdomains()."); 104111ade9eSPeter Brune ierr = DMCreateDomainDecompositionScatters(dm,nasm->n,subdms,&nasm->iscatter,&nasm->oscatter,&nasm->gscatter);CHKERRQ(ierr); 105eaedb033SPeter Brune 106eaedb033SPeter Brune ierr = SNESGetOptionsPrefix(snes, &optionsprefix);CHKERRQ(ierr); 107111ade9eSPeter Brune ierr = PetscMalloc(nasm->n*sizeof(SNES),&nasm->subsnes);CHKERRQ(ierr); 108111ade9eSPeter Brune 109111ade9eSPeter Brune for (i=0; i<nasm->n; i++) { 110cdb298fcSPeter Brune ierr = SNESCreate(PETSC_COMM_SELF,&nasm->subsnes[i]);CHKERRQ(ierr); 111cdb298fcSPeter Brune ierr = SNESAppendOptionsPrefix(nasm->subsnes[i],optionsprefix);CHKERRQ(ierr); 112cdb298fcSPeter Brune ierr = SNESAppendOptionsPrefix(nasm->subsnes[i],"sub_");CHKERRQ(ierr); 113cdb298fcSPeter Brune ierr = SNESSetDM(nasm->subsnes[i],subdms[i]);CHKERRQ(ierr); 114cdb298fcSPeter Brune ierr = SNESSetFromOptions(nasm->subsnes[i]);CHKERRQ(ierr); 115111ade9eSPeter Brune ierr = DMDestroy(&subdms[i]);CHKERRQ(ierr); 116111ade9eSPeter Brune } 117111ade9eSPeter Brune ierr = PetscFree(subdms);CHKERRQ(ierr); 118ce94432eSBarry Smith } else SETERRQ(PetscObjectComm((PetscObject)snes),PETSC_ERR_ARG_WRONGSTATE,"Cannot construct local problems automatically without a DM!"); 119ce94432eSBarry Smith } else SETERRQ(PetscObjectComm((PetscObject)snes),PETSC_ERR_ARG_WRONGSTATE,"Must set subproblems manually if there is no DM!"); 120111ade9eSPeter Brune /* allocate the global vectors */ 121111ade9eSPeter Brune ierr = PetscMalloc(nasm->n*sizeof(Vec),&nasm->x);CHKERRQ(ierr); 122111ade9eSPeter Brune ierr = PetscMalloc(nasm->n*sizeof(Vec),&nasm->xl);CHKERRQ(ierr); 123111ade9eSPeter Brune ierr = PetscMalloc(nasm->n*sizeof(Vec),&nasm->y);CHKERRQ(ierr); 124111ade9eSPeter Brune ierr = PetscMalloc(nasm->n*sizeof(Vec),&nasm->b);CHKERRQ(ierr); 125111ade9eSPeter Brune 126111ade9eSPeter Brune for (i=0; i<nasm->n; i++) { 1270298fd71SBarry Smith ierr = SNESGetFunction(nasm->subsnes[i],&F,NULL,NULL);CHKERRQ(ierr); 12876857b2aSPeter Brune if (!nasm->x[i]) {ierr = VecDuplicate(F,&nasm->x[i]);CHKERRQ(ierr);} 12976857b2aSPeter Brune if (!nasm->y[i]) {ierr = VecDuplicate(F,&nasm->y[i]);CHKERRQ(ierr);} 13076857b2aSPeter Brune if (!nasm->b[i]) {ierr = VecDuplicate(F,&nasm->b[i]);CHKERRQ(ierr);} 13176857b2aSPeter Brune if (!nasm->xl[i]) { 132111ade9eSPeter Brune ierr = SNESGetDM(nasm->subsnes[i],&subdm);CHKERRQ(ierr); 133111ade9eSPeter Brune ierr = DMCreateLocalVector(subdm,&nasm->xl[i]);CHKERRQ(ierr); 13476857b2aSPeter Brune } 1350298fd71SBarry Smith ierr = DMGlobalToLocalHookAdd(subdm,DMGlobalToLocalSubDomainDirichletHook_Private,NULL,nasm->xl[i]);CHKERRQ(ierr); 136111ade9eSPeter Brune } 137*d728fb7dSPeter Brune if (nasm->finaljacobian) {ierr = SNESSetUpMatrices(snes);CHKERRQ(ierr);} 138eaedb033SPeter Brune PetscFunctionReturn(0); 139eaedb033SPeter Brune } 140eaedb033SPeter Brune 141eaedb033SPeter Brune #undef __FUNCT__ 142eaedb033SPeter Brune #define __FUNCT__ "SNESSetFromOptions_NASM" 143eaedb033SPeter Brune PetscErrorCode SNESSetFromOptions_NASM(SNES snes) 144eaedb033SPeter Brune { 145eaedb033SPeter Brune PetscErrorCode ierr; 146111ade9eSPeter Brune PCASMType asmtype; 147b20c023fSPeter Brune PetscBool flg,monflg; 148111ade9eSPeter Brune SNES_NASM *nasm = (SNES_NASM*)snes->data; 1496e111a19SKarl Rupp 150eaedb033SPeter Brune PetscFunctionBegin; 151111ade9eSPeter Brune ierr = PetscOptionsHead("Nonlinear Additive Schwartz options");CHKERRQ(ierr); 152111ade9eSPeter Brune ierr = PetscOptionsEnum("-snes_nasm_type","Type of restriction/extension","",SNESNASMTypes,(PetscEnum)nasm->type,(PetscEnum*)&asmtype,&flg);CHKERRQ(ierr); 1531aa26658SKarl Rupp if (flg) nasm->type = asmtype; 154b20c023fSPeter Brune flg = PETSC_FALSE; 155b20c023fSPeter Brune monflg = PETSC_TRUE; 156b20c023fSPeter Brune ierr = PetscOptionsBool("-snes_nasm_log","Log times for subSNES solves and restriction","",monflg,&monflg,&flg);CHKERRQ(ierr); 157*d728fb7dSPeter Brune ierr = PetscOptionsBool("-snes_nasm_finaljacobian","Compute the global jacobian of the final iterate (for ASPIN)","",nasm->finaljacobian,&nasm->finaljacobian,NULL);CHKERRQ(ierr); 158b20c023fSPeter Brune if (flg) { 159b20c023fSPeter Brune ierr = PetscLogEventRegister("SNESNASMSubSolve",((PetscObject)snes)->classid,&nasm->eventsubsolve);CHKERRQ(ierr); 160b20c023fSPeter Brune ierr = PetscLogEventRegister("SNESNASMRestrict",((PetscObject)snes)->classid,&nasm->eventrestrictinterp);CHKERRQ(ierr); 161b20c023fSPeter Brune } 162eaedb033SPeter Brune ierr = PetscOptionsTail();CHKERRQ(ierr); 163eaedb033SPeter Brune PetscFunctionReturn(0); 164eaedb033SPeter Brune } 165eaedb033SPeter Brune 166eaedb033SPeter Brune #undef __FUNCT__ 167eaedb033SPeter Brune #define __FUNCT__ "SNESView_NASM" 168eaedb033SPeter Brune PetscErrorCode SNESView_NASM(SNES snes, PetscViewer viewer) 169eaedb033SPeter Brune { 170eaedb033SPeter Brune PetscFunctionBegin; 171b20c023fSPeter Brune SNES_NASM *nasm = (SNES_NASM*)snes->data; 172b20c023fSPeter Brune PetscErrorCode ierr; 173b20c023fSPeter Brune PetscMPIInt rank; 174b20c023fSPeter Brune PetscInt i,N; 175b20c023fSPeter Brune PetscBool iascii,isstring; 176b20c023fSPeter Brune PetscViewer sviewer; 177ce94432eSBarry Smith MPI_Comm comm; 178b20c023fSPeter Brune 179b20c023fSPeter Brune PetscFunctionBegin; 180ce94432eSBarry Smith ierr = PetscObjectGetComm((PetscObject)snes,&comm);CHKERRQ(ierr); 181b20c023fSPeter Brune ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERASCII,&iascii);CHKERRQ(ierr); 182b20c023fSPeter Brune ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERSTRING,&isstring);CHKERRQ(ierr); 183b20c023fSPeter Brune ierr = MPI_Comm_rank(comm,&rank);CHKERRQ(ierr); 184b20c023fSPeter Brune ierr = MPI_Reduce(&nasm->n,&N,1,MPIU_INT,MPIU_SUM,0,comm);CHKERRQ(ierr); 185b20c023fSPeter Brune if (iascii) { 186b20c023fSPeter Brune ierr = PetscViewerASCIIPrintf(viewer, " Nonlinear Additive Schwarz: total subdomain blocks = %D\n",N);CHKERRQ(ierr); 187b20c023fSPeter Brune ierr = PetscViewerASCIIPrintf(viewer," Nonlinear Additive Schwarz: restriction/interpolation type - %s\n",SNESNASMTypes[nasm->type]);CHKERRQ(ierr); 188b20c023fSPeter Brune ierr = PetscViewerASCIIPrintf(viewer," Nonlinear Additive Schwarz: subSNES iterations: %D subKSP iterations: %D\n",SNESNASMTypes[nasm->type]);CHKERRQ(ierr); 189b20c023fSPeter Brune ierr = PetscViewerASCIISynchronizedAllow(viewer,PETSC_TRUE);CHKERRQ(ierr); 190b20c023fSPeter Brune ierr = PetscViewerASCIISynchronizedPrintf(viewer," [%d] number of local blocks = %D\n",(int)rank,nasm->n);CHKERRQ(ierr); 191b20c023fSPeter Brune ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 192b20c023fSPeter Brune ierr = PetscViewerASCIIPrintf(viewer," Local SNES objects:\n");CHKERRQ(ierr); 193b20c023fSPeter Brune ierr = PetscViewerASCIIPushTab(viewer);CHKERRQ(ierr); 194b20c023fSPeter Brune if (!rank) { 195b20c023fSPeter Brune for (i=0; i<nasm->n; i++) { 196b20c023fSPeter Brune ierr = PetscViewerGetSingleton(viewer,&sviewer);CHKERRQ(ierr); 197b20c023fSPeter Brune ierr = SNESView(nasm->subsnes[i],sviewer);CHKERRQ(ierr); 198b20c023fSPeter Brune ierr = PetscViewerRestoreSingleton(viewer,&sviewer);CHKERRQ(ierr); 199b20c023fSPeter Brune } 200b20c023fSPeter Brune } 201b20c023fSPeter Brune ierr = PetscViewerASCIIPopTab(viewer);CHKERRQ(ierr); 202b20c023fSPeter Brune ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 203b20c023fSPeter Brune ierr = PetscViewerASCIISynchronizedAllow(viewer,PETSC_FALSE);CHKERRQ(ierr); 204b20c023fSPeter Brune } else if (isstring) { 205b20c023fSPeter Brune ierr = PetscViewerStringSPrintf(viewer," blocks=%D,type=%s",N,SNESNASMTypes[nasm->type]);CHKERRQ(ierr); 206b20c023fSPeter Brune ierr = PetscViewerGetSingleton(viewer,&sviewer);CHKERRQ(ierr); 207b20c023fSPeter Brune if (nasm->subsnes && !rank) {ierr = SNESView(nasm->subsnes[0],sviewer);CHKERRQ(ierr);} 208b20c023fSPeter Brune ierr = PetscViewerRestoreSingleton(viewer,&sviewer);CHKERRQ(ierr); 209b20c023fSPeter Brune } 210eaedb033SPeter Brune PetscFunctionReturn(0); 211eaedb033SPeter Brune } 212eaedb033SPeter Brune 213eaedb033SPeter Brune #undef __FUNCT__ 214eaedb033SPeter Brune #define __FUNCT__ "SNESNASMSetSubdomains" 21576857b2aSPeter Brune /*@ 21676857b2aSPeter Brune SNESNASMSetSubdomains - Manually Set the context required to restrict and solve subdomain problems. 21776857b2aSPeter Brune 21876857b2aSPeter Brune Not Collective 21976857b2aSPeter Brune 22076857b2aSPeter Brune Input Parameters: 22176857b2aSPeter Brune + SNES - the SNES context 22276857b2aSPeter Brune . n - the number of local subdomains 22376857b2aSPeter Brune . subsnes - solvers defined on the local subdomains 22476857b2aSPeter Brune . iscatter - scatters into the nonoverlapping portions of the local subdomains 22576857b2aSPeter Brune . oscatter - scatters into the overlapping portions of the local subdomains 22676857b2aSPeter Brune - gscatter - scatters into the (ghosted) local vector of the local subdomain 22776857b2aSPeter Brune 22876857b2aSPeter Brune Level: intermediate 22976857b2aSPeter Brune 23076857b2aSPeter Brune .keywords: SNES, NASM 23176857b2aSPeter Brune 23276857b2aSPeter Brune .seealso: SNESNASM, SNESNASMGetSubdomains() 23376857b2aSPeter Brune @*/ 234a6dfd86eSKarl Rupp PetscErrorCode SNESNASMSetSubdomains(SNES snes,PetscInt n,SNES subsnes[],VecScatter iscatter[],VecScatter oscatter[],VecScatter gscatter[]) 235a6dfd86eSKarl Rupp { 236eaedb033SPeter Brune PetscErrorCode ierr; 237111ade9eSPeter Brune PetscErrorCode (*f)(SNES,PetscInt,SNES*,VecScatter*,VecScatter*,VecScatter*); 2386e111a19SKarl Rupp 239eaedb033SPeter Brune PetscFunctionBegin; 240eaedb033SPeter Brune ierr = PetscObjectQueryFunction((PetscObject)snes,"SNESNASMSetSubdomains_C",(void (**)(void))&f);CHKERRQ(ierr); 241111ade9eSPeter Brune ierr = (f)(snes,n,subsnes,iscatter,oscatter,gscatter);CHKERRQ(ierr); 242eaedb033SPeter Brune PetscFunctionReturn(0); 243eaedb033SPeter Brune } 244eaedb033SPeter Brune 245eaedb033SPeter Brune EXTERN_C_BEGIN 246eaedb033SPeter Brune #undef __FUNCT__ 247eaedb033SPeter Brune #define __FUNCT__ "SNESNASMSetSubdomains_NASM" 248a6dfd86eSKarl Rupp PetscErrorCode SNESNASMSetSubdomains_NASM(SNES snes,PetscInt n,SNES subsnes[],VecScatter iscatter[],VecScatter oscatter[],VecScatter gscatter[]) 249a6dfd86eSKarl Rupp { 250eaedb033SPeter Brune PetscInt i; 251eaedb033SPeter Brune PetscErrorCode ierr; 252eaedb033SPeter Brune SNES_NASM *nasm = (SNES_NASM*)snes->data; 2536e111a19SKarl Rupp 254eaedb033SPeter Brune PetscFunctionBegin; 255ce94432eSBarry Smith if (snes->setupcalled) SETERRQ(PetscObjectComm((PetscObject)snes),PETSC_ERR_ARG_WRONGSTATE,"SNESNASMSetSubdomains() should be called before calling SNESSetUp()."); 256eaedb033SPeter Brune 257111ade9eSPeter Brune /* tear down the previously set things */ 258111ade9eSPeter Brune ierr = SNESReset(snes);CHKERRQ(ierr); 259111ade9eSPeter Brune 260eaedb033SPeter Brune nasm->n = n; 261111ade9eSPeter Brune if (oscatter) { 262111ade9eSPeter Brune for (i=0; i<n; i++) {ierr = PetscObjectReference((PetscObject)oscatter[i]);CHKERRQ(ierr);} 263eaedb033SPeter Brune } 264111ade9eSPeter Brune if (iscatter) { 265111ade9eSPeter Brune for (i=0; i<n; i++) {ierr = PetscObjectReference((PetscObject)iscatter[i]);CHKERRQ(ierr);} 266eaedb033SPeter Brune } 267111ade9eSPeter Brune if (gscatter) { 268111ade9eSPeter Brune for (i=0; i<n; i++) {ierr = PetscObjectReference((PetscObject)gscatter[i]);CHKERRQ(ierr);} 269111ade9eSPeter Brune } 270111ade9eSPeter Brune if (oscatter) { 271111ade9eSPeter Brune ierr = PetscMalloc(n*sizeof(IS),&nasm->oscatter);CHKERRQ(ierr); 272eaedb033SPeter Brune for (i=0; i<n; i++) { 273111ade9eSPeter Brune nasm->oscatter[i] = oscatter[i]; 274eaedb033SPeter Brune } 275111ade9eSPeter Brune } 276111ade9eSPeter Brune if (iscatter) { 277111ade9eSPeter Brune ierr = PetscMalloc(n*sizeof(IS),&nasm->iscatter);CHKERRQ(ierr); 278eaedb033SPeter Brune for (i=0; i<n; i++) { 279111ade9eSPeter Brune nasm->iscatter[i] = iscatter[i]; 280eaedb033SPeter Brune } 281eaedb033SPeter Brune } 282111ade9eSPeter Brune if (gscatter) { 283111ade9eSPeter Brune ierr = PetscMalloc(n*sizeof(IS),&nasm->gscatter);CHKERRQ(ierr); 284eaedb033SPeter Brune for (i=0; i<n; i++) { 285111ade9eSPeter Brune nasm->gscatter[i] = gscatter[i]; 286eaedb033SPeter Brune } 287eaedb033SPeter Brune } 288111ade9eSPeter Brune 289eaedb033SPeter Brune if (subsnes) { 290eaedb033SPeter Brune ierr = PetscMalloc(n*sizeof(SNES),&nasm->subsnes);CHKERRQ(ierr); 291eaedb033SPeter Brune for (i=0; i<n; i++) { 292eaedb033SPeter Brune nasm->subsnes[i] = subsnes[i]; 293eaedb033SPeter Brune } 294eaedb033SPeter Brune } 295eaedb033SPeter Brune PetscFunctionReturn(0); 296eaedb033SPeter Brune } 297eaedb033SPeter Brune EXTERN_C_END 298eaedb033SPeter Brune 299eaedb033SPeter Brune #undef __FUNCT__ 30076857b2aSPeter Brune #define __FUNCT__ "SNESNASMGetSubdomains" 30176857b2aSPeter Brune /*@ 30276857b2aSPeter Brune SNESNASMGetSubdomains - Get the local subdomain context. 30376857b2aSPeter Brune 30476857b2aSPeter Brune Not Collective 30576857b2aSPeter Brune 30676857b2aSPeter Brune Input Parameters: 30776857b2aSPeter Brune . SNES - the SNES context 30876857b2aSPeter Brune 30976857b2aSPeter Brune Output Parameters: 31076857b2aSPeter Brune + n - the number of local subdomains 31176857b2aSPeter Brune . subsnes - solvers defined on the local subdomains 31276857b2aSPeter Brune . iscatter - scatters into the nonoverlapping portions of the local subdomains 31376857b2aSPeter Brune . oscatter - scatters into the overlapping portions of the local subdomains 31476857b2aSPeter Brune - gscatter - scatters into the (ghosted) local vector of the local subdomain 31576857b2aSPeter Brune 31676857b2aSPeter Brune Level: intermediate 31776857b2aSPeter Brune 31876857b2aSPeter Brune .keywords: SNES, NASM 31976857b2aSPeter Brune 32076857b2aSPeter Brune .seealso: SNESNASM, SNESNASMSetSubdomains() 32176857b2aSPeter Brune @*/ 32276857b2aSPeter Brune PetscErrorCode SNESNASMGetSubdomains(SNES snes,PetscInt *n,SNES *subsnes[],VecScatter *iscatter[],VecScatter *oscatter[],VecScatter *gscatter[]) 32376857b2aSPeter Brune { 32476857b2aSPeter Brune PetscErrorCode ierr; 32576857b2aSPeter Brune PetscErrorCode (*f)(SNES,PetscInt*,SNES**,VecScatter**,VecScatter**,VecScatter**); 32676857b2aSPeter Brune 32776857b2aSPeter Brune PetscFunctionBegin; 32876857b2aSPeter Brune ierr = PetscObjectQueryFunction((PetscObject)snes,"SNESNASMGetSubdomains_C",(void (**)(void))&f);CHKERRQ(ierr); 32976857b2aSPeter Brune ierr = (f)(snes,n,subsnes,iscatter,oscatter,gscatter);CHKERRQ(ierr); 33076857b2aSPeter Brune PetscFunctionReturn(0); 33176857b2aSPeter Brune } 33276857b2aSPeter Brune 33376857b2aSPeter Brune EXTERN_C_BEGIN 33476857b2aSPeter Brune #undef __FUNCT__ 33576857b2aSPeter Brune #define __FUNCT__ "SNESNASMGetSubdomains_NASM" 33676857b2aSPeter Brune PetscErrorCode SNESNASMGetSubdomains_NASM(SNES snes,PetscInt *n,SNES *subsnes[],VecScatter *iscatter[],VecScatter *oscatter[],VecScatter *gscatter[]) 33776857b2aSPeter Brune { 33876857b2aSPeter Brune SNES_NASM *nasm = (SNES_NASM*)snes->data; 33976857b2aSPeter Brune 34076857b2aSPeter Brune PetscFunctionBegin; 34176857b2aSPeter Brune if (n) *n = nasm->n; 34276857b2aSPeter Brune if (oscatter) *oscatter = nasm->oscatter; 34376857b2aSPeter Brune if (iscatter) *iscatter = nasm->iscatter; 34476857b2aSPeter Brune if (gscatter) *gscatter = nasm->gscatter; 34576857b2aSPeter Brune if (subsnes) *subsnes = nasm->subsnes; 34676857b2aSPeter Brune PetscFunctionReturn(0); 34776857b2aSPeter Brune } 34876857b2aSPeter Brune EXTERN_C_END 34976857b2aSPeter Brune 35076857b2aSPeter Brune #undef __FUNCT__ 35176857b2aSPeter Brune #define __FUNCT__ "SNESNASMGetSubdomainVecs" 35276857b2aSPeter Brune /*@ 35376857b2aSPeter Brune SNESNASMGetSubdomainVecs - Get the processor-local subdomain vectors 35476857b2aSPeter Brune 35576857b2aSPeter Brune Not Collective 35676857b2aSPeter Brune 35776857b2aSPeter Brune Input Parameters: 35876857b2aSPeter Brune . SNES - the SNES context 35976857b2aSPeter Brune 36076857b2aSPeter Brune Output Parameters: 36176857b2aSPeter Brune + n - the number of local subdomains 36276857b2aSPeter Brune . x - The subdomain solution vector 36376857b2aSPeter Brune . y - The subdomain step vector 36476857b2aSPeter Brune . b - The subdomain RHS vector 36576857b2aSPeter Brune - xl - The subdomain local vectors (ghosted) 36676857b2aSPeter Brune 36776857b2aSPeter Brune Level: developer 36876857b2aSPeter Brune 36976857b2aSPeter Brune .keywords: SNES, NASM 37076857b2aSPeter Brune 37176857b2aSPeter Brune .seealso: SNESNASM, SNESNASMGetSubdomains() 37276857b2aSPeter Brune @*/ 37376857b2aSPeter Brune PetscErrorCode SNESNASMGetSubdomainVecs(SNES snes,PetscInt *n,Vec **x,Vec **y,Vec **b, Vec **xl) 37476857b2aSPeter Brune { 37576857b2aSPeter Brune PetscErrorCode ierr; 37676857b2aSPeter Brune PetscErrorCode (*f)(SNES,PetscInt*,Vec**,Vec**,Vec**,Vec**); 37776857b2aSPeter Brune 37876857b2aSPeter Brune PetscFunctionBegin; 37976857b2aSPeter Brune ierr = PetscObjectQueryFunction((PetscObject)snes,"SNESNASMGetSubdomainVecs_C",(void (**)(void))&f);CHKERRQ(ierr); 38076857b2aSPeter Brune ierr = (f)(snes,n,x,y,b,xl);CHKERRQ(ierr); 38176857b2aSPeter Brune PetscFunctionReturn(0); 38276857b2aSPeter Brune } 38376857b2aSPeter Brune 38476857b2aSPeter Brune EXTERN_C_BEGIN 38576857b2aSPeter Brune #undef __FUNCT__ 38676857b2aSPeter Brune #define __FUNCT__ "SNESNASMGetSubdomainVecs_NASM" 38776857b2aSPeter Brune PetscErrorCode SNESNASMGetSubdomainVecs_NASM(SNES snes,PetscInt *n,Vec **x,Vec **y,Vec **b,Vec **xl) 38876857b2aSPeter Brune { 38976857b2aSPeter Brune SNES_NASM *nasm = (SNES_NASM*)snes->data; 39076857b2aSPeter Brune 39176857b2aSPeter Brune PetscFunctionBegin; 39276857b2aSPeter Brune if (n) *n = nasm->n; 39376857b2aSPeter Brune if (x) *x = nasm->x; 39476857b2aSPeter Brune if (y) *y = nasm->y; 39576857b2aSPeter Brune if (b) *b = nasm->b; 39676857b2aSPeter Brune if (xl) *xl = nasm->xl; 39776857b2aSPeter Brune PetscFunctionReturn(0); 39876857b2aSPeter Brune } 39976857b2aSPeter Brune EXTERN_C_END 40076857b2aSPeter Brune 401*d728fb7dSPeter Brune #undef __FUNCT__ 402*d728fb7dSPeter Brune #define __FUNCT__ "SNESNASMSetComputeFinalJacobian" 403*d728fb7dSPeter Brune /*@ 404*d728fb7dSPeter Brune SNESNASMSetComputeFinalJacobian - Schedules the computation of the global and subdomain jacobians upon convergence 405*d728fb7dSPeter Brune 406*d728fb7dSPeter Brune Collective on SNES 407*d728fb7dSPeter Brune 408*d728fb7dSPeter Brune Input Parameters: 409*d728fb7dSPeter Brune + SNES - the SNES context 410*d728fb7dSPeter Brune - flg - indication of whether to compute the jacobians or not 411*d728fb7dSPeter Brune 412*d728fb7dSPeter Brune Level: developer 413*d728fb7dSPeter Brune 414*d728fb7dSPeter Brune Notes: This is used almost exclusively in the implementation of ASPIN, where the converged subdomain and global jacobian 415*d728fb7dSPeter Brune is needed at each linear iteration. 416*d728fb7dSPeter Brune 417*d728fb7dSPeter Brune .keywords: SNES, NASM, ASPIN 418*d728fb7dSPeter Brune 419*d728fb7dSPeter Brune .seealso: SNESNASM, SNESNASMGetSubdomains() 420*d728fb7dSPeter Brune @*/ 421*d728fb7dSPeter Brune PetscErrorCode SNESNASMSetComputeFinalJacobian(SNES snes,PetscBool flg) 422*d728fb7dSPeter Brune { 423*d728fb7dSPeter Brune PetscErrorCode (*f)(SNES,PetscBool); 424*d728fb7dSPeter Brune PetscErrorCode ierr; 425*d728fb7dSPeter Brune 426*d728fb7dSPeter Brune PetscFunctionBegin; 427*d728fb7dSPeter Brune ierr = PetscObjectQueryFunction((PetscObject)snes,"SNESNASMSetComputeFinalJacobian_C",(void (**)(void))&f);CHKERRQ(ierr); 428*d728fb7dSPeter Brune ierr = (f)(snes,flg);CHKERRQ(ierr); 429*d728fb7dSPeter Brune PetscFunctionReturn(0); 430*d728fb7dSPeter Brune } 431*d728fb7dSPeter Brune 432*d728fb7dSPeter Brune EXTERN_C_BEGIN 433*d728fb7dSPeter Brune #undef __FUNCT__ 434*d728fb7dSPeter Brune #define __FUNCT__ "SNESNASMSetComputeFinalJacobian_NASM" 435*d728fb7dSPeter Brune PetscErrorCode SNESNASMSetComputeFinalJacobian_NASM(SNES snes,PetscBool flg) 436*d728fb7dSPeter Brune { 437*d728fb7dSPeter Brune SNES_NASM *nasm = (SNES_NASM*)snes->data; 438*d728fb7dSPeter Brune 439*d728fb7dSPeter Brune PetscFunctionBegin; 440*d728fb7dSPeter Brune nasm->finaljacobian = flg; 441*d728fb7dSPeter Brune PetscFunctionReturn(0); 442*d728fb7dSPeter Brune } 443*d728fb7dSPeter Brune EXTERN_C_END 444*d728fb7dSPeter Brune 44576857b2aSPeter Brune 44676857b2aSPeter Brune #undef __FUNCT__ 447eaedb033SPeter Brune #define __FUNCT__ "SNESNASMSolveLocal_Private" 4480adebc6cSBarry Smith PetscErrorCode SNESNASMSolveLocal_Private(SNES snes,Vec B,Vec Y,Vec X) 4490adebc6cSBarry Smith { 450eaedb033SPeter Brune SNES_NASM *nasm = (SNES_NASM*)snes->data; 451258e1594SPeter Brune SNES subsnes; 452eaedb033SPeter Brune PetscInt i; 453eaedb033SPeter Brune PetscErrorCode ierr; 454111ade9eSPeter Brune Vec Xlloc,Xl,Bl,Yl; 455111ade9eSPeter Brune VecScatter iscat,oscat,gscat; 456111ade9eSPeter Brune DM dm,subdm; 4570adebc6cSBarry Smith 458eaedb033SPeter Brune PetscFunctionBegin; 459eaedb033SPeter Brune ierr = SNESGetDM(snes,&dm);CHKERRQ(ierr); 460111ade9eSPeter Brune ierr = VecSet(Y,0);CHKERRQ(ierr); 461b20c023fSPeter Brune 462b20c023fSPeter Brune if (nasm->eventrestrictinterp) {ierr = PetscLogEventBegin(nasm->eventrestrictinterp,snes,0,0,0);CHKERRQ(ierr);} 463eaedb033SPeter Brune for (i=0; i<nasm->n; i++) { 46470c78f05SPeter Brune /* scatter the solution to the local solution */ 46570c78f05SPeter Brune Xlloc = nasm->xl[i]; 46670c78f05SPeter Brune gscat = nasm->gscatter[i]; 46770c78f05SPeter Brune oscat = nasm->oscatter[i]; 46870c78f05SPeter Brune ierr = VecScatterBegin(gscat,X,Xlloc,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 46970c78f05SPeter Brune if (B) { 47070c78f05SPeter Brune /* scatter the RHS to the local RHS */ 47170c78f05SPeter Brune Bl = nasm->b[i]; 47270c78f05SPeter Brune ierr = VecScatterBegin(oscat,B,Bl,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 47370c78f05SPeter Brune } 47470c78f05SPeter Brune } 475b20c023fSPeter Brune if (nasm->eventrestrictinterp) {ierr = PetscLogEventEnd(nasm->eventrestrictinterp,snes,0,0,0);CHKERRQ(ierr);} 476b20c023fSPeter Brune 47770c78f05SPeter Brune for (i=0; i<nasm->n; i++) { 47870c78f05SPeter Brune Xlloc = nasm->xl[i]; 479d590fa63SPeter Brune gscat = nasm->gscatter[i]; 480d590fa63SPeter Brune oscat = nasm->oscatter[i]; 48170c78f05SPeter Brune ierr = VecScatterEnd(gscat,X,Xlloc,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 48270c78f05SPeter Brune if (B) { 48324b7f281SPeter Brune Bl = nasm->b[i]; 48470c78f05SPeter Brune ierr = VecScatterEnd(oscat,B,Bl,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 48570c78f05SPeter Brune } 48670c78f05SPeter Brune } 487b20c023fSPeter Brune 488b20c023fSPeter Brune if (nasm->eventsubsolve) {ierr = PetscLogEventBegin(nasm->eventsubsolve,snes,0,0,0);CHKERRQ(ierr);} 48970c78f05SPeter Brune for (i=0; i<nasm->n; i++) { 49070c78f05SPeter Brune Xl = nasm->x[i]; 49170c78f05SPeter Brune Xlloc = nasm->xl[i]; 49270c78f05SPeter Brune Yl = nasm->y[i]; 493258e1594SPeter Brune subsnes = nasm->subsnes[i]; 494258e1594SPeter Brune ierr = SNESGetDM(subsnes,&subdm);CHKERRQ(ierr); 495111ade9eSPeter Brune iscat = nasm->iscatter[i]; 496111ade9eSPeter Brune oscat = nasm->oscatter[i]; 497111ade9eSPeter Brune gscat = nasm->gscatter[i]; 498111ade9eSPeter Brune ierr = DMSubDomainRestrict(dm,oscat,gscat,subdm);CHKERRQ(ierr); 49924b7f281SPeter Brune if (B) { 50024b7f281SPeter Brune Bl = nasm->b[i]; 50124b7f281SPeter Brune } else { 50224b7f281SPeter Brune Bl = NULL; 50324b7f281SPeter Brune } 50470c78f05SPeter Brune ierr = DMLocalToGlobalBegin(subdm,Xlloc,INSERT_VALUES,Xl);CHKERRQ(ierr); 50570c78f05SPeter Brune ierr = DMLocalToGlobalEnd(subdm,Xlloc,INSERT_VALUES,Xl);CHKERRQ(ierr); 506111ade9eSPeter Brune ierr = VecCopy(Xl,Yl);CHKERRQ(ierr); 507258e1594SPeter Brune ierr = SNESSolve(subsnes,Bl,Yl);CHKERRQ(ierr); 508111ade9eSPeter Brune ierr = VecAXPY(Yl,-1.0,Xl);CHKERRQ(ierr); 50970c78f05SPeter Brune } 510b20c023fSPeter Brune if (nasm->eventsubsolve) {ierr = PetscLogEventEnd(nasm->eventsubsolve,snes,0,0,0);CHKERRQ(ierr);} 511111ade9eSPeter Brune 512ce94432eSBarry Smith ierr = MPI_Barrier(PetscObjectComm((PetscObject)snes));CHKERRQ(ierr); 51370c78f05SPeter Brune 514b20c023fSPeter Brune if (nasm->eventrestrictinterp) {ierr = PetscLogEventBegin(nasm->eventrestrictinterp,snes,0,0,0);CHKERRQ(ierr);} 51570c78f05SPeter Brune for (i=0; i<nasm->n; i++) { 51670c78f05SPeter Brune Yl = nasm->y[i]; 51770c78f05SPeter Brune iscat = nasm->iscatter[i]; 51870c78f05SPeter Brune oscat = nasm->oscatter[i]; 519111ade9eSPeter Brune if (nasm->type == PC_ASM_BASIC) { 520111ade9eSPeter Brune ierr = VecScatterBegin(oscat,Yl,Y,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 521111ade9eSPeter Brune } else if (nasm->type == PC_ASM_RESTRICT) { 522111ade9eSPeter Brune ierr = VecScatterBegin(iscat,Yl,Y,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 523ce94432eSBarry Smith } else SETERRQ(PetscObjectComm((PetscObject)snes),PETSC_ERR_ARG_WRONGSTATE,"Only basic and restrict types are supported for SNESNASM"); 524eaedb033SPeter Brune } 525eaedb033SPeter Brune 52670c78f05SPeter Brune for (i=0; i<nasm->n; i++) { 52770c78f05SPeter Brune Yl = nasm->y[i]; 52870c78f05SPeter Brune iscat = nasm->iscatter[i]; 52970c78f05SPeter Brune oscat = nasm->oscatter[i]; 53070c78f05SPeter Brune if (nasm->type == PC_ASM_BASIC) { 53170c78f05SPeter Brune ierr = VecScatterEnd(oscat,Yl,Y,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 53270c78f05SPeter Brune } else if (nasm->type == PC_ASM_RESTRICT) { 53370c78f05SPeter Brune ierr = VecScatterEnd(iscat,Yl,Y,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 534ce94432eSBarry Smith } else SETERRQ(PetscObjectComm((PetscObject)snes),PETSC_ERR_ARG_WRONGSTATE,"Only basic and restrict types are supported for SNESNASM"); 53570c78f05SPeter Brune } 536b20c023fSPeter Brune if (nasm->eventrestrictinterp) {ierr = PetscLogEventEnd(nasm->eventrestrictinterp,snes,0,0,0);CHKERRQ(ierr);} 53770c78f05SPeter Brune 538ce94432eSBarry Smith ierr = MPI_Barrier(PetscObjectComm((PetscObject)snes));CHKERRQ(ierr); 539cd939e56SPeter Brune 540111ade9eSPeter Brune ierr = VecAXPY(X,1.0,Y);CHKERRQ(ierr); 541eaedb033SPeter Brune PetscFunctionReturn(0); 542eaedb033SPeter Brune } 543eaedb033SPeter Brune 544eaedb033SPeter Brune #undef __FUNCT__ 545*d728fb7dSPeter Brune #define __FUNCT__ "SNESNASMComputeFinalJacobian_Private" 546*d728fb7dSPeter Brune PetscErrorCode SNESNASMComputeFinalJacobian_Private(SNES snes, Vec X) 547*d728fb7dSPeter Brune { 548*d728fb7dSPeter Brune SNES_NASM *nasm = (SNES_NASM*)snes->data; 549*d728fb7dSPeter Brune SNES subsnes; 550*d728fb7dSPeter Brune PetscInt i; 551*d728fb7dSPeter Brune PetscErrorCode ierr; 552*d728fb7dSPeter Brune Vec Xlloc,Xl; 553*d728fb7dSPeter Brune VecScatter oscat,gscat; 554*d728fb7dSPeter Brune DM dm,subdm; 555*d728fb7dSPeter Brune MatStructure flg = DIFFERENT_NONZERO_PATTERN; 556*d728fb7dSPeter Brune 557*d728fb7dSPeter Brune PetscFunctionBegin; 558*d728fb7dSPeter Brune ierr = SNESComputeJacobian(snes,X,&snes->jacobian,&snes->jacobian_pre,&flg);CHKERRQ(ierr); 559*d728fb7dSPeter Brune ierr = SNESGetDM(snes,&dm);CHKERRQ(ierr); 560*d728fb7dSPeter Brune if (nasm->eventrestrictinterp) {ierr = PetscLogEventBegin(nasm->eventrestrictinterp,snes,0,0,0);CHKERRQ(ierr);} 561*d728fb7dSPeter Brune for (i=0; i<nasm->n; i++) { 562*d728fb7dSPeter Brune /* scatter the solution to the local solution */ 563*d728fb7dSPeter Brune Xlloc = nasm->xl[i]; 564*d728fb7dSPeter Brune gscat = nasm->gscatter[i]; 565*d728fb7dSPeter Brune oscat = nasm->oscatter[i]; 566*d728fb7dSPeter Brune ierr = VecScatterBegin(gscat,X,Xlloc,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 567*d728fb7dSPeter Brune } 568*d728fb7dSPeter Brune if (nasm->eventrestrictinterp) {ierr = PetscLogEventEnd(nasm->eventrestrictinterp,snes,0,0,0);CHKERRQ(ierr);} 569*d728fb7dSPeter Brune 570*d728fb7dSPeter Brune for (i=0; i<nasm->n; i++) { 571*d728fb7dSPeter Brune Xlloc = nasm->xl[i]; 572*d728fb7dSPeter Brune gscat = nasm->gscatter[i]; 573*d728fb7dSPeter Brune oscat = nasm->oscatter[i]; 574*d728fb7dSPeter Brune ierr = VecScatterEnd(gscat,X,Xlloc,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 575*d728fb7dSPeter Brune } 576*d728fb7dSPeter Brune 577*d728fb7dSPeter Brune for (i=0; i<nasm->n; i++) { 578*d728fb7dSPeter Brune Xl = nasm->x[i]; 579*d728fb7dSPeter Brune Xlloc = nasm->xl[i]; 580*d728fb7dSPeter Brune subsnes = nasm->subsnes[i]; 581*d728fb7dSPeter Brune ierr = SNESGetDM(subsnes,&subdm);CHKERRQ(ierr); 582*d728fb7dSPeter Brune oscat = nasm->oscatter[i]; 583*d728fb7dSPeter Brune gscat = nasm->gscatter[i]; 584*d728fb7dSPeter Brune ierr = DMSubDomainRestrict(dm,oscat,gscat,subdm);CHKERRQ(ierr); 585*d728fb7dSPeter Brune ierr = DMLocalToGlobalBegin(subdm,Xlloc,INSERT_VALUES,Xl);CHKERRQ(ierr); 586*d728fb7dSPeter Brune ierr = DMLocalToGlobalEnd(subdm,Xlloc,INSERT_VALUES,Xl);CHKERRQ(ierr); 587*d728fb7dSPeter Brune ierr = SNESComputeJacobian(subsnes,Xl,&snes->jacobian,&subsnes->jacobian_pre,&flg);CHKERRQ(ierr); 588*d728fb7dSPeter Brune ierr = KSPSetOperators(subsnes->ksp,subsnes->jacobian,subsnes->jacobian_pre,flg);CHKERRQ(ierr); 589*d728fb7dSPeter Brune } 590*d728fb7dSPeter Brune 591*d728fb7dSPeter Brune ierr = MPI_Barrier(PetscObjectComm((PetscObject)snes));CHKERRQ(ierr); 592*d728fb7dSPeter Brune PetscFunctionReturn(0); 593*d728fb7dSPeter Brune } 594*d728fb7dSPeter Brune 595*d728fb7dSPeter Brune #undef __FUNCT__ 596eaedb033SPeter Brune #define __FUNCT__ "SNESSolve_NASM" 597eaedb033SPeter Brune PetscErrorCode SNESSolve_NASM(SNES snes) 598eaedb033SPeter Brune { 599eaedb033SPeter Brune Vec F; 600eaedb033SPeter Brune Vec X; 601eaedb033SPeter Brune Vec B; 602111ade9eSPeter Brune Vec Y; 603eaedb033SPeter Brune PetscInt i; 604eaedb033SPeter Brune PetscReal fnorm; 605eaedb033SPeter Brune PetscErrorCode ierr; 606eaedb033SPeter Brune SNESNormType normtype; 607*d728fb7dSPeter Brune SNES_NASM *nasm = (SNES_NASM*)snes->data; 608eaedb033SPeter Brune 609eaedb033SPeter Brune PetscFunctionBegin; 610eaedb033SPeter Brune X = snes->vec_sol; 611111ade9eSPeter Brune Y = snes->vec_sol_update; 612eaedb033SPeter Brune F = snes->vec_func; 613eaedb033SPeter Brune B = snes->vec_rhs; 614eaedb033SPeter Brune 615eaedb033SPeter Brune ierr = PetscObjectTakeAccess(snes);CHKERRQ(ierr); 616eaedb033SPeter Brune snes->iter = 0; 617eaedb033SPeter Brune snes->norm = 0.; 618eaedb033SPeter Brune ierr = PetscObjectGrantAccess(snes);CHKERRQ(ierr); 619eaedb033SPeter Brune snes->reason = SNES_CONVERGED_ITERATING; 620eaedb033SPeter Brune ierr = SNESGetNormType(snes, &normtype);CHKERRQ(ierr); 621eaedb033SPeter Brune if (normtype == SNES_NORM_FUNCTION || normtype == SNES_NORM_INITIAL_ONLY || normtype == SNES_NORM_INITIAL_FINAL_ONLY) { 622eaedb033SPeter Brune /* compute the initial function and preconditioned update delX */ 623eaedb033SPeter Brune if (!snes->vec_func_init_set) { 624eaedb033SPeter Brune ierr = SNESComputeFunction(snes,X,F);CHKERRQ(ierr); 625eaedb033SPeter Brune if (snes->domainerror) { 626eaedb033SPeter Brune snes->reason = SNES_DIVERGED_FUNCTION_DOMAIN; 627eaedb033SPeter Brune PetscFunctionReturn(0); 628eaedb033SPeter Brune } 6291aa26658SKarl Rupp } else snes->vec_func_init_set = PETSC_FALSE; 630eaedb033SPeter Brune 631eaedb033SPeter Brune /* convergence test */ 632eaedb033SPeter Brune if (!snes->norm_init_set) { 633eaedb033SPeter Brune ierr = VecNorm(F, NORM_2, &fnorm);CHKERRQ(ierr); /* fnorm <- ||F|| */ 634eaedb033SPeter Brune if (PetscIsInfOrNanReal(fnorm)) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_FP,"Infinite or not-a-number generated in norm"); 635eaedb033SPeter Brune } else { 636eaedb033SPeter Brune fnorm = snes->norm_init; 637eaedb033SPeter Brune snes->norm_init_set = PETSC_FALSE; 638eaedb033SPeter Brune } 639eaedb033SPeter Brune ierr = PetscObjectTakeAccess(snes);CHKERRQ(ierr); 640eaedb033SPeter Brune snes->iter = 0; 641eaedb033SPeter Brune snes->norm = fnorm; 642eaedb033SPeter Brune ierr = PetscObjectGrantAccess(snes);CHKERRQ(ierr); 643a71f0d7dSBarry Smith ierr = SNESLogConvergenceHistory(snes,snes->norm,0);CHKERRQ(ierr); 644eaedb033SPeter Brune ierr = SNESMonitor(snes,0,snes->norm);CHKERRQ(ierr); 645eaedb033SPeter Brune 646eaedb033SPeter Brune /* set parameter for default relative tolerance convergence test */ 647eaedb033SPeter Brune snes->ttol = fnorm*snes->rtol; 648eaedb033SPeter Brune 649eaedb033SPeter Brune /* test convergence */ 650eaedb033SPeter Brune ierr = (*snes->ops->converged)(snes,0,0.0,0.0,fnorm,&snes->reason,snes->cnvP);CHKERRQ(ierr); 651eaedb033SPeter Brune if (snes->reason) PetscFunctionReturn(0); 652eaedb033SPeter Brune } else { 653eaedb033SPeter Brune ierr = PetscObjectGrantAccess(snes);CHKERRQ(ierr); 654a71f0d7dSBarry Smith ierr = SNESLogConvergenceHistory(snes,snes->norm,0);CHKERRQ(ierr); 655eaedb033SPeter Brune ierr = SNESMonitor(snes,0,snes->norm);CHKERRQ(ierr); 656eaedb033SPeter Brune } 657eaedb033SPeter Brune 658eaedb033SPeter Brune /* Call general purpose update function */ 659eaedb033SPeter Brune if (snes->ops->update) { 660eaedb033SPeter Brune ierr = (*snes->ops->update)(snes, snes->iter);CHKERRQ(ierr); 661eaedb033SPeter Brune } 662eaedb033SPeter Brune 663eaedb033SPeter Brune for (i = 0; i < snes->max_its; i++) { 664111ade9eSPeter Brune ierr = SNESNASMSolveLocal_Private(snes,B,Y,X);CHKERRQ(ierr); 665eaedb033SPeter Brune if (normtype == SNES_NORM_FUNCTION || ((i == snes->max_its - 1) && (normtype == SNES_NORM_INITIAL_FINAL_ONLY || normtype == SNES_NORM_FINAL_ONLY))) { 666eaedb033SPeter Brune ierr = SNESComputeFunction(snes,X,F);CHKERRQ(ierr); 667eaedb033SPeter Brune if (snes->domainerror) { 668eaedb033SPeter Brune snes->reason = SNES_DIVERGED_FUNCTION_DOMAIN; 669*d728fb7dSPeter Brune break; 670eaedb033SPeter Brune } 671eaedb033SPeter Brune ierr = VecNorm(F, NORM_2, &fnorm);CHKERRQ(ierr); /* fnorm <- ||F|| */ 672eaedb033SPeter Brune if (PetscIsInfOrNanReal(fnorm)) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_FP,"Infinite or not-a-number generated in norm"); 673eaedb033SPeter Brune } 674eaedb033SPeter Brune /* Monitor convergence */ 675eaedb033SPeter Brune ierr = PetscObjectTakeAccess(snes);CHKERRQ(ierr); 676eaedb033SPeter Brune snes->iter = i+1; 677eaedb033SPeter Brune snes->norm = fnorm; 678eaedb033SPeter Brune ierr = PetscObjectGrantAccess(snes);CHKERRQ(ierr); 679a71f0d7dSBarry Smith ierr = SNESLogConvergenceHistory(snes,snes->norm,0);CHKERRQ(ierr); 680eaedb033SPeter Brune ierr = SNESMonitor(snes,snes->iter,snes->norm);CHKERRQ(ierr); 681eaedb033SPeter Brune /* Test for convergence */ 682eaedb033SPeter Brune if (normtype == SNES_NORM_FUNCTION) ierr = (*snes->ops->converged)(snes,snes->iter,0.0,0.0,fnorm,&snes->reason,snes->cnvP);CHKERRQ(ierr); 683*d728fb7dSPeter Brune if (snes->reason) break; 684eaedb033SPeter Brune /* Call general purpose update function */ 685eaedb033SPeter Brune if (snes->ops->update) { 686eaedb033SPeter Brune ierr = (*snes->ops->update)(snes, snes->iter);CHKERRQ(ierr); 687eaedb033SPeter Brune } 688eaedb033SPeter Brune } 689*d728fb7dSPeter Brune if (nasm->finaljacobian) {ierr = SNESNASMComputeFinalJacobian_Private(snes,X);CHKERRQ(ierr);} 690eaedb033SPeter Brune if (normtype == SNES_NORM_FUNCTION) { 691eaedb033SPeter Brune if (i == snes->max_its) { 692eaedb033SPeter Brune ierr = PetscInfo1(snes,"Maximum number of iterations has been reached: %D\n",snes->max_its);CHKERRQ(ierr); 693eaedb033SPeter Brune if (!snes->reason) snes->reason = SNES_DIVERGED_MAX_IT; 694eaedb033SPeter Brune } 6951aa26658SKarl Rupp } else if (!snes->reason) snes->reason = SNES_CONVERGED_ITS; /* NASM is meant to be used as a preconditioner */ 696eaedb033SPeter Brune PetscFunctionReturn(0); 697eaedb033SPeter Brune } 698eaedb033SPeter Brune 699eaedb033SPeter Brune /*MC 700eaedb033SPeter Brune SNESNASM - Nonlinear Additive Schwartz 701eaedb033SPeter Brune 702eaedb033SPeter Brune Level: advanced 703eaedb033SPeter Brune 704eaedb033SPeter Brune .seealso: SNESCreate(), SNES, SNESSetType(), SNESType (for list of available types) 705eaedb033SPeter Brune M*/ 706eaedb033SPeter Brune 707eaedb033SPeter Brune EXTERN_C_BEGIN 708eaedb033SPeter Brune #undef __FUNCT__ 709eaedb033SPeter Brune #define __FUNCT__ "SNESCreate_NASM" 710eaedb033SPeter Brune PetscErrorCode SNESCreate_NASM(SNES snes) 711eaedb033SPeter Brune { 712eaedb033SPeter Brune SNES_NASM *nasm; 713eaedb033SPeter Brune PetscErrorCode ierr; 714eaedb033SPeter Brune 715eaedb033SPeter Brune PetscFunctionBegin; 716eaedb033SPeter Brune ierr = PetscNewLog(snes, SNES_NASM, &nasm);CHKERRQ(ierr); 717eaedb033SPeter Brune snes->data = (void*)nasm; 718eaedb033SPeter Brune 719eaedb033SPeter Brune nasm->n = PETSC_DECIDE; 720eaedb033SPeter Brune nasm->subsnes = 0; 721eaedb033SPeter Brune nasm->x = 0; 722111ade9eSPeter Brune nasm->xl = 0; 723111ade9eSPeter Brune nasm->y = 0; 724eaedb033SPeter Brune nasm->b = 0; 725111ade9eSPeter Brune nasm->oscatter = 0; 726111ade9eSPeter Brune nasm->iscatter = 0; 727111ade9eSPeter Brune nasm->gscatter = 0; 728111ade9eSPeter Brune 729111ade9eSPeter Brune nasm->type = PC_ASM_BASIC; 730*d728fb7dSPeter Brune nasm->finaljacobian = PETSC_FALSE; 731eaedb033SPeter Brune 732eaedb033SPeter Brune snes->ops->destroy = SNESDestroy_NASM; 733eaedb033SPeter Brune snes->ops->setup = SNESSetUp_NASM; 734eaedb033SPeter Brune snes->ops->setfromoptions = SNESSetFromOptions_NASM; 735eaedb033SPeter Brune snes->ops->view = SNESView_NASM; 736eaedb033SPeter Brune snes->ops->solve = SNESSolve_NASM; 737eaedb033SPeter Brune snes->ops->reset = SNESReset_NASM; 738eaedb033SPeter Brune 739eaedb033SPeter Brune snes->usesksp = PETSC_FALSE; 740eaedb033SPeter Brune snes->usespc = PETSC_FALSE; 741eaedb033SPeter Brune 7420298fd71SBarry Smith nasm->eventrestrictinterp = 0; 7430298fd71SBarry Smith nasm->eventsubsolve = 0; 744b20c023fSPeter Brune 745eaedb033SPeter Brune if (!snes->tolerancesset) { 746eaedb033SPeter Brune snes->max_its = 10000; 747eaedb033SPeter Brune snes->max_funcs = 10000; 748eaedb033SPeter Brune } 749eaedb033SPeter Brune 750eaedb033SPeter Brune ierr = PetscObjectComposeFunctionDynamic((PetscObject)snes,"SNESNASMSetSubdomains_C","SNESNASMSetSubdomains_NASM", 751eaedb033SPeter Brune SNESNASMSetSubdomains_NASM);CHKERRQ(ierr); 75276857b2aSPeter Brune ierr = PetscObjectComposeFunctionDynamic((PetscObject)snes,"SNESNASMGetSubdomains_C","SNESNASMGetSubdomains_NASM", 75376857b2aSPeter Brune SNESNASMGetSubdomains_NASM);CHKERRQ(ierr); 75476857b2aSPeter Brune ierr = PetscObjectComposeFunctionDynamic((PetscObject)snes,"SNESNASMGetSubdomainVecs_C","SNESNASMGetSubdomainVecs_NASM", 75576857b2aSPeter Brune SNESNASMGetSubdomainVecs_NASM);CHKERRQ(ierr); 756*d728fb7dSPeter Brune ierr = PetscObjectComposeFunctionDynamic((PetscObject)snes,"SNESNASMSetComputeFinalJacobian_C","SNESNASMSetComputeFinalJacobian_NASM", 757*d728fb7dSPeter Brune SNESNASMSetComputeFinalJacobian_NASM);CHKERRQ(ierr); 758eaedb033SPeter Brune PetscFunctionReturn(0); 759eaedb033SPeter Brune } 760eaedb033SPeter Brune EXTERN_C_END 761