xref: /petsc/src/snes/impls/nasm/nasm.c (revision d728fb7dff1ad61d29df6dcab893bdd59c1da584)
1eaedb033SPeter Brune #include <petsc-private/snesimpl.h>             /*I   "petscsnes.h"   I*/
2111ade9eSPeter Brune #include <petscdm.h>
3eaedb033SPeter Brune 
4eaedb033SPeter Brune typedef struct {
5eaedb033SPeter Brune   PetscInt   n;                   /* local subdomains */
6eaedb033SPeter Brune   SNES       *subsnes;            /* nonlinear solvers for each subdomain */
7eaedb033SPeter Brune   Vec        *x;                  /* solution vectors */
8111ade9eSPeter Brune   Vec        *xl;                 /* solution local vectors */
9111ade9eSPeter Brune   Vec        *y;                  /* step vectors */
10eaedb033SPeter Brune   Vec        *b;                  /* rhs vectors */
11111ade9eSPeter Brune   VecScatter *oscatter;           /* scatter from global space to the subdomain global space */
12111ade9eSPeter Brune   VecScatter *iscatter;           /* scatter from global space to the nonoverlapping subdomain space */
13111ade9eSPeter Brune   VecScatter *gscatter;           /* scatter from global space to the subdomain local space */
14111ade9eSPeter Brune   PCASMType  type;                /* ASM type */
15111ade9eSPeter Brune   PetscBool  usesdm;              /* use the DM for setting up the subproblems */
16*d728fb7dSPeter Brune   PetscBool  finaljacobian;       /* compute the jacobian of the converged solution */
17b20c023fSPeter Brune 
18b20c023fSPeter Brune   /* logging events */
19b20c023fSPeter Brune   PetscLogEvent eventrestrictinterp;
20b20c023fSPeter Brune   PetscLogEvent eventsubsolve;
21eaedb033SPeter Brune } SNES_NASM;
22eaedb033SPeter Brune 
/*
   Names of the NASM restriction/extension types.  The table is handed to
   PetscOptionsEnum() for -snes_nasm_type and is indexed by the stored type when
   the solver is viewed.  The value names are followed by the enum type name,
   the enum prefix and a terminating null entry.
*/
const char *const SNESNASMTypes[] = {
  "NONE",
  "RESTRICT",
  "INTERPOLATE",
  "BASIC",
  "PCASMType",
  "PC_ASM_",
  0
};
24b20c023fSPeter Brune 
25eaedb033SPeter Brune #undef __FUNCT__
26eaedb033SPeter Brune #define __FUNCT__ "SNESReset_NASM"
27eaedb033SPeter Brune PetscErrorCode SNESReset_NASM(SNES snes)
28eaedb033SPeter Brune {
29eaedb033SPeter Brune   SNES_NASM      *nasm = (SNES_NASM*)snes->data;
30eaedb033SPeter Brune   PetscErrorCode ierr;
31eaedb033SPeter Brune   PetscInt       i;
326e111a19SKarl Rupp 
33eaedb033SPeter Brune   PetscFunctionBegin;
34eaedb033SPeter Brune   for (i=0; i<nasm->n; i++) {
35111ade9eSPeter Brune     if (nasm->xl) { ierr = VecDestroy(&nasm->xl[i]);CHKERRQ(ierr); }
36f5f7c1b9SKarl Rupp     if (nasm->x) { ierr = VecDestroy(&nasm->x[i]);CHKERRQ(ierr); }
37111ade9eSPeter Brune     if (nasm->y) { ierr = VecDestroy(&nasm->y[i]);CHKERRQ(ierr); }
38bc8c1f72SJose Roman     if (nasm->b) { ierr = VecDestroy(&nasm->b[i]);CHKERRQ(ierr); }
39eaedb033SPeter Brune 
40bc8c1f72SJose Roman     if (nasm->subsnes) { ierr = SNESDestroy(&nasm->subsnes[i]);CHKERRQ(ierr); }
41111ade9eSPeter Brune     if (nasm->oscatter) { ierr = VecScatterDestroy(&nasm->oscatter[i]);CHKERRQ(ierr); }
42111ade9eSPeter Brune     if (nasm->iscatter) { ierr = VecScatterDestroy(&nasm->iscatter[i]);CHKERRQ(ierr); }
43111ade9eSPeter Brune     if (nasm->gscatter) { ierr = VecScatterDestroy(&nasm->gscatter[i]);CHKERRQ(ierr); }
44eaedb033SPeter Brune   }
45111ade9eSPeter Brune 
46111ade9eSPeter Brune   if (nasm->x) {ierr = PetscFree(nasm->x);CHKERRQ(ierr);}
47111ade9eSPeter Brune   if (nasm->xl) {ierr = PetscFree(nasm->xl);CHKERRQ(ierr);}
48111ade9eSPeter Brune   if (nasm->y) {ierr = PetscFree(nasm->y);CHKERRQ(ierr);}
49111ade9eSPeter Brune   if (nasm->b) {ierr = PetscFree(nasm->b);CHKERRQ(ierr);}
50111ade9eSPeter Brune 
51111ade9eSPeter Brune   if (nasm->subsnes) {ierr = PetscFree(nasm->subsnes);CHKERRQ(ierr);}
52111ade9eSPeter Brune   if (nasm->oscatter) {ierr = PetscFree(nasm->oscatter);CHKERRQ(ierr);}
53111ade9eSPeter Brune   if (nasm->iscatter) {ierr = PetscFree(nasm->iscatter);CHKERRQ(ierr);}
54111ade9eSPeter Brune   if (nasm->gscatter) {ierr = PetscFree(nasm->gscatter);CHKERRQ(ierr);}
55b20c023fSPeter Brune 
56b20c023fSPeter Brune   nasm->eventrestrictinterp = 0;
57b20c023fSPeter Brune   nasm->eventsubsolve = 0;
58eaedb033SPeter Brune   PetscFunctionReturn(0);
59eaedb033SPeter Brune }
60eaedb033SPeter Brune 
61eaedb033SPeter Brune #undef __FUNCT__
62eaedb033SPeter Brune #define __FUNCT__ "SNESDestroy_NASM"
63eaedb033SPeter Brune PetscErrorCode SNESDestroy_NASM(SNES snes)
64eaedb033SPeter Brune {
65eaedb033SPeter Brune   PetscErrorCode ierr;
666e111a19SKarl Rupp 
67eaedb033SPeter Brune   PetscFunctionBegin;
68eaedb033SPeter Brune   ierr = SNESReset_NASM(snes);CHKERRQ(ierr);
6922d28d08SBarry Smith   ierr = PetscFree(snes->data);CHKERRQ(ierr);
70eaedb033SPeter Brune   PetscFunctionReturn(0);
71eaedb033SPeter Brune }
72eaedb033SPeter Brune 
73eaedb033SPeter Brune #undef __FUNCT__
74111ade9eSPeter Brune #define __FUNCT__ "DMGlobalToLocalSubDomainDirichletHook_Private"
750adebc6cSBarry Smith PetscErrorCode DMGlobalToLocalSubDomainDirichletHook_Private(DM dm,Vec g,InsertMode mode,Vec l,void *ctx)
760adebc6cSBarry Smith {
77111ade9eSPeter Brune   PetscErrorCode ierr;
78111ade9eSPeter Brune   Vec            bcs = (Vec)ctx;
796e111a19SKarl Rupp 
80111ade9eSPeter Brune   PetscFunctionBegin;
81111ade9eSPeter Brune   ierr = VecCopy(bcs,l);CHKERRQ(ierr);
82111ade9eSPeter Brune   PetscFunctionReturn(0);
83111ade9eSPeter Brune }
84111ade9eSPeter Brune 
85111ade9eSPeter Brune #undef __FUNCT__
86eaedb033SPeter Brune #define __FUNCT__ "SNESSetUp_NASM"
87eaedb033SPeter Brune PetscErrorCode SNESSetUp_NASM(SNES snes)
88eaedb033SPeter Brune {
89eaedb033SPeter Brune   SNES_NASM      *nasm = (SNES_NASM*)snes->data;
90eaedb033SPeter Brune   PetscErrorCode ierr;
9176857b2aSPeter Brune   DM             dm,subdm;
92111ade9eSPeter Brune   DM             *subdms;
93111ade9eSPeter Brune   PetscInt       i;
94eaedb033SPeter Brune   const char     *optionsprefix;
95111ade9eSPeter Brune   Vec            F;
96eaedb033SPeter Brune 
97eaedb033SPeter Brune   PetscFunctionBegin;
98eaedb033SPeter Brune   if (!nasm->subsnes) {
99eaedb033SPeter Brune     ierr = SNESGetDM(snes,&dm);CHKERRQ(ierr);
1000a696f66SPeter Brune     if (dm) {
101eaedb033SPeter Brune       nasm->usesdm = PETSC_TRUE;
1020298fd71SBarry Smith       ierr         = DMCreateDomainDecomposition(dm,&nasm->n,NULL,NULL,NULL,&subdms);CHKERRQ(ierr);
103ce94432eSBarry Smith       if (!subdms) SETERRQ(PetscObjectComm((PetscObject)dm),PETSC_ERR_ARG_WRONGSTATE,"DM has no default decomposition defined.  Set subsolves manually with SNESNASMSetSubdomains().");
104111ade9eSPeter Brune       ierr = DMCreateDomainDecompositionScatters(dm,nasm->n,subdms,&nasm->iscatter,&nasm->oscatter,&nasm->gscatter);CHKERRQ(ierr);
105eaedb033SPeter Brune 
106eaedb033SPeter Brune       ierr = SNESGetOptionsPrefix(snes, &optionsprefix);CHKERRQ(ierr);
107111ade9eSPeter Brune       ierr = PetscMalloc(nasm->n*sizeof(SNES),&nasm->subsnes);CHKERRQ(ierr);
108111ade9eSPeter Brune 
109111ade9eSPeter Brune       for (i=0; i<nasm->n; i++) {
110cdb298fcSPeter Brune         ierr = SNESCreate(PETSC_COMM_SELF,&nasm->subsnes[i]);CHKERRQ(ierr);
111cdb298fcSPeter Brune         ierr = SNESAppendOptionsPrefix(nasm->subsnes[i],optionsprefix);CHKERRQ(ierr);
112cdb298fcSPeter Brune         ierr = SNESAppendOptionsPrefix(nasm->subsnes[i],"sub_");CHKERRQ(ierr);
113cdb298fcSPeter Brune         ierr = SNESSetDM(nasm->subsnes[i],subdms[i]);CHKERRQ(ierr);
114cdb298fcSPeter Brune         ierr = SNESSetFromOptions(nasm->subsnes[i]);CHKERRQ(ierr);
115111ade9eSPeter Brune         ierr = DMDestroy(&subdms[i]);CHKERRQ(ierr);
116111ade9eSPeter Brune       }
117111ade9eSPeter Brune       ierr = PetscFree(subdms);CHKERRQ(ierr);
118ce94432eSBarry Smith     } else SETERRQ(PetscObjectComm((PetscObject)snes),PETSC_ERR_ARG_WRONGSTATE,"Cannot construct local problems automatically without a DM!");
119ce94432eSBarry Smith   } else SETERRQ(PetscObjectComm((PetscObject)snes),PETSC_ERR_ARG_WRONGSTATE,"Must set subproblems manually if there is no DM!");
120111ade9eSPeter Brune   /* allocate the global vectors */
121111ade9eSPeter Brune   ierr = PetscMalloc(nasm->n*sizeof(Vec),&nasm->x);CHKERRQ(ierr);
122111ade9eSPeter Brune   ierr = PetscMalloc(nasm->n*sizeof(Vec),&nasm->xl);CHKERRQ(ierr);
123111ade9eSPeter Brune   ierr = PetscMalloc(nasm->n*sizeof(Vec),&nasm->y);CHKERRQ(ierr);
124111ade9eSPeter Brune   ierr = PetscMalloc(nasm->n*sizeof(Vec),&nasm->b);CHKERRQ(ierr);
125111ade9eSPeter Brune 
126111ade9eSPeter Brune   for (i=0; i<nasm->n; i++) {
1270298fd71SBarry Smith     ierr = SNESGetFunction(nasm->subsnes[i],&F,NULL,NULL);CHKERRQ(ierr);
12876857b2aSPeter Brune     if (!nasm->x[i]) {ierr = VecDuplicate(F,&nasm->x[i]);CHKERRQ(ierr);}
12976857b2aSPeter Brune     if (!nasm->y[i]) {ierr = VecDuplicate(F,&nasm->y[i]);CHKERRQ(ierr);}
13076857b2aSPeter Brune     if (!nasm->b[i]) {ierr = VecDuplicate(F,&nasm->b[i]);CHKERRQ(ierr);}
13176857b2aSPeter Brune     if (!nasm->xl[i]) {
132111ade9eSPeter Brune       ierr = SNESGetDM(nasm->subsnes[i],&subdm);CHKERRQ(ierr);
133111ade9eSPeter Brune       ierr = DMCreateLocalVector(subdm,&nasm->xl[i]);CHKERRQ(ierr);
13476857b2aSPeter Brune     }
1350298fd71SBarry Smith     ierr = DMGlobalToLocalHookAdd(subdm,DMGlobalToLocalSubDomainDirichletHook_Private,NULL,nasm->xl[i]);CHKERRQ(ierr);
136111ade9eSPeter Brune   }
137*d728fb7dSPeter Brune   if (nasm->finaljacobian) {ierr = SNESSetUpMatrices(snes);CHKERRQ(ierr);}
138eaedb033SPeter Brune   PetscFunctionReturn(0);
139eaedb033SPeter Brune }
140eaedb033SPeter Brune 
141eaedb033SPeter Brune #undef __FUNCT__
142eaedb033SPeter Brune #define __FUNCT__ "SNESSetFromOptions_NASM"
143eaedb033SPeter Brune PetscErrorCode SNESSetFromOptions_NASM(SNES snes)
144eaedb033SPeter Brune {
145eaedb033SPeter Brune   PetscErrorCode    ierr;
146111ade9eSPeter Brune   PCASMType         asmtype;
147b20c023fSPeter Brune   PetscBool         flg,monflg;
148111ade9eSPeter Brune   SNES_NASM         *nasm = (SNES_NASM*)snes->data;
1496e111a19SKarl Rupp 
150eaedb033SPeter Brune   PetscFunctionBegin;
151111ade9eSPeter Brune   ierr = PetscOptionsHead("Nonlinear Additive Schwartz options");CHKERRQ(ierr);
152111ade9eSPeter Brune   ierr = PetscOptionsEnum("-snes_nasm_type","Type of restriction/extension","",SNESNASMTypes,(PetscEnum)nasm->type,(PetscEnum*)&asmtype,&flg);CHKERRQ(ierr);
1531aa26658SKarl Rupp   if (flg) nasm->type = asmtype;
154b20c023fSPeter Brune   flg    = PETSC_FALSE;
155b20c023fSPeter Brune   monflg = PETSC_TRUE;
156b20c023fSPeter Brune   ierr   = PetscOptionsBool("-snes_nasm_log","Log times for subSNES solves and restriction","",monflg,&monflg,&flg);CHKERRQ(ierr);
157*d728fb7dSPeter Brune   ierr   = PetscOptionsBool("-snes_nasm_finaljacobian","Compute the global jacobian of the final iterate (for ASPIN)","",nasm->finaljacobian,&nasm->finaljacobian,NULL);CHKERRQ(ierr);
158b20c023fSPeter Brune   if (flg) {
159b20c023fSPeter Brune     ierr = PetscLogEventRegister("SNESNASMSubSolve",((PetscObject)snes)->classid,&nasm->eventsubsolve);CHKERRQ(ierr);
160b20c023fSPeter Brune     ierr = PetscLogEventRegister("SNESNASMRestrict",((PetscObject)snes)->classid,&nasm->eventrestrictinterp);CHKERRQ(ierr);
161b20c023fSPeter Brune   }
162eaedb033SPeter Brune   ierr = PetscOptionsTail();CHKERRQ(ierr);
163eaedb033SPeter Brune   PetscFunctionReturn(0);
164eaedb033SPeter Brune }
165eaedb033SPeter Brune 
166eaedb033SPeter Brune #undef __FUNCT__
167eaedb033SPeter Brune #define __FUNCT__ "SNESView_NASM"
168eaedb033SPeter Brune PetscErrorCode SNESView_NASM(SNES snes, PetscViewer viewer)
169eaedb033SPeter Brune {
170eaedb033SPeter Brune   PetscFunctionBegin;
171b20c023fSPeter Brune   SNES_NASM      *nasm = (SNES_NASM*)snes->data;
172b20c023fSPeter Brune   PetscErrorCode ierr;
173b20c023fSPeter Brune   PetscMPIInt    rank;
174b20c023fSPeter Brune   PetscInt       i,N;
175b20c023fSPeter Brune   PetscBool      iascii,isstring;
176b20c023fSPeter Brune   PetscViewer    sviewer;
177ce94432eSBarry Smith   MPI_Comm       comm;
178b20c023fSPeter Brune 
179b20c023fSPeter Brune   PetscFunctionBegin;
180ce94432eSBarry Smith   ierr = PetscObjectGetComm((PetscObject)snes,&comm);CHKERRQ(ierr);
181b20c023fSPeter Brune   ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERASCII,&iascii);CHKERRQ(ierr);
182b20c023fSPeter Brune   ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERSTRING,&isstring);CHKERRQ(ierr);
183b20c023fSPeter Brune   ierr = MPI_Comm_rank(comm,&rank);CHKERRQ(ierr);
184b20c023fSPeter Brune   ierr = MPI_Reduce(&nasm->n,&N,1,MPIU_INT,MPIU_SUM,0,comm);CHKERRQ(ierr);
185b20c023fSPeter Brune   if (iascii) {
186b20c023fSPeter Brune     ierr = PetscViewerASCIIPrintf(viewer, "  Nonlinear Additive Schwarz: total subdomain blocks = %D\n",N);CHKERRQ(ierr);
187b20c023fSPeter Brune     ierr = PetscViewerASCIIPrintf(viewer,"  Nonlinear Additive Schwarz: restriction/interpolation type - %s\n",SNESNASMTypes[nasm->type]);CHKERRQ(ierr);
188b20c023fSPeter Brune     ierr = PetscViewerASCIIPrintf(viewer,"  Nonlinear Additive Schwarz: subSNES iterations: %D subKSP iterations: %D\n",SNESNASMTypes[nasm->type]);CHKERRQ(ierr);
189b20c023fSPeter Brune     ierr = PetscViewerASCIISynchronizedAllow(viewer,PETSC_TRUE);CHKERRQ(ierr);
190b20c023fSPeter Brune     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"  [%d] number of local blocks = %D\n",(int)rank,nasm->n);CHKERRQ(ierr);
191b20c023fSPeter Brune     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
192b20c023fSPeter Brune     ierr = PetscViewerASCIIPrintf(viewer,"  Local SNES objects:\n");CHKERRQ(ierr);
193b20c023fSPeter Brune     ierr = PetscViewerASCIIPushTab(viewer);CHKERRQ(ierr);
194b20c023fSPeter Brune     if (!rank) {
195b20c023fSPeter Brune       for (i=0; i<nasm->n; i++) {
196b20c023fSPeter Brune         ierr = PetscViewerGetSingleton(viewer,&sviewer);CHKERRQ(ierr);
197b20c023fSPeter Brune         ierr = SNESView(nasm->subsnes[i],sviewer);CHKERRQ(ierr);
198b20c023fSPeter Brune         ierr = PetscViewerRestoreSingleton(viewer,&sviewer);CHKERRQ(ierr);
199b20c023fSPeter Brune       }
200b20c023fSPeter Brune     }
201b20c023fSPeter Brune     ierr = PetscViewerASCIIPopTab(viewer);CHKERRQ(ierr);
202b20c023fSPeter Brune     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
203b20c023fSPeter Brune     ierr = PetscViewerASCIISynchronizedAllow(viewer,PETSC_FALSE);CHKERRQ(ierr);
204b20c023fSPeter Brune   } else if (isstring) {
205b20c023fSPeter Brune     ierr = PetscViewerStringSPrintf(viewer," blocks=%D,type=%s",N,SNESNASMTypes[nasm->type]);CHKERRQ(ierr);
206b20c023fSPeter Brune     ierr = PetscViewerGetSingleton(viewer,&sviewer);CHKERRQ(ierr);
207b20c023fSPeter Brune     if (nasm->subsnes && !rank) {ierr = SNESView(nasm->subsnes[0],sviewer);CHKERRQ(ierr);}
208b20c023fSPeter Brune     ierr = PetscViewerRestoreSingleton(viewer,&sviewer);CHKERRQ(ierr);
209b20c023fSPeter Brune   }
210eaedb033SPeter Brune   PetscFunctionReturn(0);
211eaedb033SPeter Brune }
212eaedb033SPeter Brune 
213eaedb033SPeter Brune #undef __FUNCT__
214eaedb033SPeter Brune #define __FUNCT__ "SNESNASMSetSubdomains"
21576857b2aSPeter Brune /*@
21676857b2aSPeter Brune    SNESNASMSetSubdomains - Manually Set the context required to restrict and solve subdomain problems.
21776857b2aSPeter Brune 
21876857b2aSPeter Brune    Not Collective
21976857b2aSPeter Brune 
22076857b2aSPeter Brune    Input Parameters:
22176857b2aSPeter Brune +  SNES - the SNES context
22276857b2aSPeter Brune .  n - the number of local subdomains
22376857b2aSPeter Brune .  subsnes - solvers defined on the local subdomains
22476857b2aSPeter Brune .  iscatter - scatters into the nonoverlapping portions of the local subdomains
22576857b2aSPeter Brune .  oscatter - scatters into the overlapping portions of the local subdomains
22676857b2aSPeter Brune -  gscatter - scatters into the (ghosted) local vector of the local subdomain
22776857b2aSPeter Brune 
22876857b2aSPeter Brune    Level: intermediate
22976857b2aSPeter Brune 
23076857b2aSPeter Brune .keywords: SNES, NASM
23176857b2aSPeter Brune 
23276857b2aSPeter Brune .seealso: SNESNASM, SNESNASMGetSubdomains()
23376857b2aSPeter Brune @*/
234a6dfd86eSKarl Rupp PetscErrorCode SNESNASMSetSubdomains(SNES snes,PetscInt n,SNES subsnes[],VecScatter iscatter[],VecScatter oscatter[],VecScatter gscatter[])
235a6dfd86eSKarl Rupp {
236eaedb033SPeter Brune   PetscErrorCode ierr;
237111ade9eSPeter Brune   PetscErrorCode (*f)(SNES,PetscInt,SNES*,VecScatter*,VecScatter*,VecScatter*);
2386e111a19SKarl Rupp 
239eaedb033SPeter Brune   PetscFunctionBegin;
240eaedb033SPeter Brune   ierr = PetscObjectQueryFunction((PetscObject)snes,"SNESNASMSetSubdomains_C",(void (**)(void))&f);CHKERRQ(ierr);
241111ade9eSPeter Brune   ierr = (f)(snes,n,subsnes,iscatter,oscatter,gscatter);CHKERRQ(ierr);
242eaedb033SPeter Brune   PetscFunctionReturn(0);
243eaedb033SPeter Brune }
244eaedb033SPeter Brune 
245eaedb033SPeter Brune EXTERN_C_BEGIN
246eaedb033SPeter Brune #undef __FUNCT__
247eaedb033SPeter Brune #define __FUNCT__ "SNESNASMSetSubdomains_NASM"
248a6dfd86eSKarl Rupp PetscErrorCode SNESNASMSetSubdomains_NASM(SNES snes,PetscInt n,SNES subsnes[],VecScatter iscatter[],VecScatter oscatter[],VecScatter gscatter[])
249a6dfd86eSKarl Rupp {
250eaedb033SPeter Brune   PetscInt       i;
251eaedb033SPeter Brune   PetscErrorCode ierr;
252eaedb033SPeter Brune   SNES_NASM      *nasm = (SNES_NASM*)snes->data;
2536e111a19SKarl Rupp 
254eaedb033SPeter Brune   PetscFunctionBegin;
255ce94432eSBarry Smith   if (snes->setupcalled) SETERRQ(PetscObjectComm((PetscObject)snes),PETSC_ERR_ARG_WRONGSTATE,"SNESNASMSetSubdomains() should be called before calling SNESSetUp().");
256eaedb033SPeter Brune 
257111ade9eSPeter Brune   /* tear down the previously set things */
258111ade9eSPeter Brune   ierr = SNESReset(snes);CHKERRQ(ierr);
259111ade9eSPeter Brune 
260eaedb033SPeter Brune   nasm->n = n;
261111ade9eSPeter Brune   if (oscatter) {
262111ade9eSPeter Brune     for (i=0; i<n; i++) {ierr = PetscObjectReference((PetscObject)oscatter[i]);CHKERRQ(ierr);}
263eaedb033SPeter Brune   }
264111ade9eSPeter Brune   if (iscatter) {
265111ade9eSPeter Brune     for (i=0; i<n; i++) {ierr = PetscObjectReference((PetscObject)iscatter[i]);CHKERRQ(ierr);}
266eaedb033SPeter Brune   }
267111ade9eSPeter Brune   if (gscatter) {
268111ade9eSPeter Brune     for (i=0; i<n; i++) {ierr = PetscObjectReference((PetscObject)gscatter[i]);CHKERRQ(ierr);}
269111ade9eSPeter Brune   }
270111ade9eSPeter Brune   if (oscatter) {
271111ade9eSPeter Brune     ierr = PetscMalloc(n*sizeof(IS),&nasm->oscatter);CHKERRQ(ierr);
272eaedb033SPeter Brune     for (i=0; i<n; i++) {
273111ade9eSPeter Brune       nasm->oscatter[i] = oscatter[i];
274eaedb033SPeter Brune     }
275111ade9eSPeter Brune   }
276111ade9eSPeter Brune   if (iscatter) {
277111ade9eSPeter Brune     ierr = PetscMalloc(n*sizeof(IS),&nasm->iscatter);CHKERRQ(ierr);
278eaedb033SPeter Brune     for (i=0; i<n; i++) {
279111ade9eSPeter Brune       nasm->iscatter[i] = iscatter[i];
280eaedb033SPeter Brune     }
281eaedb033SPeter Brune   }
282111ade9eSPeter Brune   if (gscatter) {
283111ade9eSPeter Brune     ierr = PetscMalloc(n*sizeof(IS),&nasm->gscatter);CHKERRQ(ierr);
284eaedb033SPeter Brune     for (i=0; i<n; i++) {
285111ade9eSPeter Brune       nasm->gscatter[i] = gscatter[i];
286eaedb033SPeter Brune     }
287eaedb033SPeter Brune   }
288111ade9eSPeter Brune 
289eaedb033SPeter Brune   if (subsnes) {
290eaedb033SPeter Brune     ierr = PetscMalloc(n*sizeof(SNES),&nasm->subsnes);CHKERRQ(ierr);
291eaedb033SPeter Brune     for (i=0; i<n; i++) {
292eaedb033SPeter Brune       nasm->subsnes[i] = subsnes[i];
293eaedb033SPeter Brune     }
294eaedb033SPeter Brune   }
295eaedb033SPeter Brune   PetscFunctionReturn(0);
296eaedb033SPeter Brune }
297eaedb033SPeter Brune EXTERN_C_END
298eaedb033SPeter Brune 
299eaedb033SPeter Brune #undef __FUNCT__
30076857b2aSPeter Brune #define __FUNCT__ "SNESNASMGetSubdomains"
30176857b2aSPeter Brune /*@
30276857b2aSPeter Brune    SNESNASMGetSubdomains - Get the local subdomain context.
30376857b2aSPeter Brune 
30476857b2aSPeter Brune    Not Collective
30576857b2aSPeter Brune 
30676857b2aSPeter Brune    Input Parameters:
30776857b2aSPeter Brune .  SNES - the SNES context
30876857b2aSPeter Brune 
30976857b2aSPeter Brune    Output Parameters:
31076857b2aSPeter Brune +  n - the number of local subdomains
31176857b2aSPeter Brune .  subsnes - solvers defined on the local subdomains
31276857b2aSPeter Brune .  iscatter - scatters into the nonoverlapping portions of the local subdomains
31376857b2aSPeter Brune .  oscatter - scatters into the overlapping portions of the local subdomains
31476857b2aSPeter Brune -  gscatter - scatters into the (ghosted) local vector of the local subdomain
31576857b2aSPeter Brune 
31676857b2aSPeter Brune    Level: intermediate
31776857b2aSPeter Brune 
31876857b2aSPeter Brune .keywords: SNES, NASM
31976857b2aSPeter Brune 
32076857b2aSPeter Brune .seealso: SNESNASM, SNESNASMSetSubdomains()
32176857b2aSPeter Brune @*/
32276857b2aSPeter Brune PetscErrorCode SNESNASMGetSubdomains(SNES snes,PetscInt *n,SNES *subsnes[],VecScatter *iscatter[],VecScatter *oscatter[],VecScatter *gscatter[])
32376857b2aSPeter Brune {
32476857b2aSPeter Brune   PetscErrorCode ierr;
32576857b2aSPeter Brune   PetscErrorCode (*f)(SNES,PetscInt*,SNES**,VecScatter**,VecScatter**,VecScatter**);
32676857b2aSPeter Brune 
32776857b2aSPeter Brune   PetscFunctionBegin;
32876857b2aSPeter Brune   ierr = PetscObjectQueryFunction((PetscObject)snes,"SNESNASMGetSubdomains_C",(void (**)(void))&f);CHKERRQ(ierr);
32976857b2aSPeter Brune   ierr = (f)(snes,n,subsnes,iscatter,oscatter,gscatter);CHKERRQ(ierr);
33076857b2aSPeter Brune   PetscFunctionReturn(0);
33176857b2aSPeter Brune }
33276857b2aSPeter Brune 
33376857b2aSPeter Brune EXTERN_C_BEGIN
33476857b2aSPeter Brune #undef __FUNCT__
33576857b2aSPeter Brune #define __FUNCT__ "SNESNASMGetSubdomains_NASM"
33676857b2aSPeter Brune PetscErrorCode SNESNASMGetSubdomains_NASM(SNES snes,PetscInt *n,SNES *subsnes[],VecScatter *iscatter[],VecScatter *oscatter[],VecScatter *gscatter[])
33776857b2aSPeter Brune {
33876857b2aSPeter Brune   SNES_NASM      *nasm = (SNES_NASM*)snes->data;
33976857b2aSPeter Brune 
34076857b2aSPeter Brune   PetscFunctionBegin;
34176857b2aSPeter Brune   if (n) *n = nasm->n;
34276857b2aSPeter Brune   if (oscatter) *oscatter = nasm->oscatter;
34376857b2aSPeter Brune   if (iscatter) *iscatter = nasm->iscatter;
34476857b2aSPeter Brune   if (gscatter) *gscatter = nasm->gscatter;
34576857b2aSPeter Brune   if (subsnes)  *subsnes  = nasm->subsnes;
34676857b2aSPeter Brune   PetscFunctionReturn(0);
34776857b2aSPeter Brune }
34876857b2aSPeter Brune EXTERN_C_END
34976857b2aSPeter Brune 
35076857b2aSPeter Brune #undef __FUNCT__
35176857b2aSPeter Brune #define __FUNCT__ "SNESNASMGetSubdomainVecs"
35276857b2aSPeter Brune /*@
35376857b2aSPeter Brune    SNESNASMGetSubdomainVecs - Get the processor-local subdomain vectors
35476857b2aSPeter Brune 
35576857b2aSPeter Brune    Not Collective
35676857b2aSPeter Brune 
35776857b2aSPeter Brune    Input Parameters:
35876857b2aSPeter Brune .  SNES - the SNES context
35976857b2aSPeter Brune 
36076857b2aSPeter Brune    Output Parameters:
36176857b2aSPeter Brune +  n - the number of local subdomains
36276857b2aSPeter Brune .  x - The subdomain solution vector
36376857b2aSPeter Brune .  y - The subdomain step vector
36476857b2aSPeter Brune .  b - The subdomain RHS vector
36576857b2aSPeter Brune -  xl - The subdomain local vectors (ghosted)
36676857b2aSPeter Brune 
36776857b2aSPeter Brune    Level: developer
36876857b2aSPeter Brune 
36976857b2aSPeter Brune .keywords: SNES, NASM
37076857b2aSPeter Brune 
37176857b2aSPeter Brune .seealso: SNESNASM, SNESNASMGetSubdomains()
37276857b2aSPeter Brune @*/
37376857b2aSPeter Brune PetscErrorCode SNESNASMGetSubdomainVecs(SNES snes,PetscInt *n,Vec **x,Vec **y,Vec **b, Vec **xl)
37476857b2aSPeter Brune {
37576857b2aSPeter Brune   PetscErrorCode ierr;
37676857b2aSPeter Brune   PetscErrorCode (*f)(SNES,PetscInt*,Vec**,Vec**,Vec**,Vec**);
37776857b2aSPeter Brune 
37876857b2aSPeter Brune   PetscFunctionBegin;
37976857b2aSPeter Brune   ierr = PetscObjectQueryFunction((PetscObject)snes,"SNESNASMGetSubdomainVecs_C",(void (**)(void))&f);CHKERRQ(ierr);
38076857b2aSPeter Brune   ierr = (f)(snes,n,x,y,b,xl);CHKERRQ(ierr);
38176857b2aSPeter Brune   PetscFunctionReturn(0);
38276857b2aSPeter Brune }
38376857b2aSPeter Brune 
38476857b2aSPeter Brune EXTERN_C_BEGIN
38576857b2aSPeter Brune #undef __FUNCT__
38676857b2aSPeter Brune #define __FUNCT__ "SNESNASMGetSubdomainVecs_NASM"
38776857b2aSPeter Brune PetscErrorCode SNESNASMGetSubdomainVecs_NASM(SNES snes,PetscInt *n,Vec **x,Vec **y,Vec **b,Vec **xl)
38876857b2aSPeter Brune {
38976857b2aSPeter Brune   SNES_NASM      *nasm = (SNES_NASM*)snes->data;
39076857b2aSPeter Brune 
39176857b2aSPeter Brune   PetscFunctionBegin;
39276857b2aSPeter Brune   if (n)  *n  = nasm->n;
39376857b2aSPeter Brune   if (x)  *x  = nasm->x;
39476857b2aSPeter Brune   if (y)  *y  = nasm->y;
39576857b2aSPeter Brune   if (b)  *b  = nasm->b;
39676857b2aSPeter Brune   if (xl) *xl = nasm->xl;
39776857b2aSPeter Brune   PetscFunctionReturn(0);
39876857b2aSPeter Brune }
39976857b2aSPeter Brune EXTERN_C_END
40076857b2aSPeter Brune 
401*d728fb7dSPeter Brune #undef __FUNCT__
402*d728fb7dSPeter Brune #define __FUNCT__ "SNESNASMSetComputeFinalJacobian"
403*d728fb7dSPeter Brune /*@
404*d728fb7dSPeter Brune    SNESNASMSetComputeFinalJacobian - Schedules the computation of the global and subdomain jacobians upon convergence
405*d728fb7dSPeter Brune 
406*d728fb7dSPeter Brune    Collective on SNES
407*d728fb7dSPeter Brune 
408*d728fb7dSPeter Brune    Input Parameters:
409*d728fb7dSPeter Brune +  SNES - the SNES context
410*d728fb7dSPeter Brune -  flg - indication of whether to compute the jacobians or not
411*d728fb7dSPeter Brune 
412*d728fb7dSPeter Brune    Level: developer
413*d728fb7dSPeter Brune 
414*d728fb7dSPeter Brune    Notes: This is used almost exclusively in the implementation of ASPIN, where the converged subdomain and global jacobian
415*d728fb7dSPeter Brune    is needed at each linear iteration.
416*d728fb7dSPeter Brune 
417*d728fb7dSPeter Brune .keywords: SNES, NASM, ASPIN
418*d728fb7dSPeter Brune 
419*d728fb7dSPeter Brune .seealso: SNESNASM, SNESNASMGetSubdomains()
420*d728fb7dSPeter Brune @*/
421*d728fb7dSPeter Brune PetscErrorCode SNESNASMSetComputeFinalJacobian(SNES snes,PetscBool flg)
422*d728fb7dSPeter Brune {
423*d728fb7dSPeter Brune   PetscErrorCode (*f)(SNES,PetscBool);
424*d728fb7dSPeter Brune   PetscErrorCode ierr;
425*d728fb7dSPeter Brune 
426*d728fb7dSPeter Brune   PetscFunctionBegin;
427*d728fb7dSPeter Brune   ierr = PetscObjectQueryFunction((PetscObject)snes,"SNESNASMSetComputeFinalJacobian_C",(void (**)(void))&f);CHKERRQ(ierr);
428*d728fb7dSPeter Brune   ierr = (f)(snes,flg);CHKERRQ(ierr);
429*d728fb7dSPeter Brune   PetscFunctionReturn(0);
430*d728fb7dSPeter Brune }
431*d728fb7dSPeter Brune 
432*d728fb7dSPeter Brune EXTERN_C_BEGIN
433*d728fb7dSPeter Brune #undef __FUNCT__
434*d728fb7dSPeter Brune #define __FUNCT__ "SNESNASMSetComputeFinalJacobian_NASM"
435*d728fb7dSPeter Brune PetscErrorCode SNESNASMSetComputeFinalJacobian_NASM(SNES snes,PetscBool flg)
436*d728fb7dSPeter Brune {
437*d728fb7dSPeter Brune   SNES_NASM      *nasm = (SNES_NASM*)snes->data;
438*d728fb7dSPeter Brune 
439*d728fb7dSPeter Brune   PetscFunctionBegin;
440*d728fb7dSPeter Brune   nasm->finaljacobian = flg;
441*d728fb7dSPeter Brune   PetscFunctionReturn(0);
442*d728fb7dSPeter Brune }
443*d728fb7dSPeter Brune EXTERN_C_END
444*d728fb7dSPeter Brune 
44576857b2aSPeter Brune 
44676857b2aSPeter Brune #undef __FUNCT__
447eaedb033SPeter Brune #define __FUNCT__ "SNESNASMSolveLocal_Private"
4480adebc6cSBarry Smith PetscErrorCode SNESNASMSolveLocal_Private(SNES snes,Vec B,Vec Y,Vec X)
4490adebc6cSBarry Smith {
450eaedb033SPeter Brune   SNES_NASM      *nasm = (SNES_NASM*)snes->data;
451258e1594SPeter Brune   SNES           subsnes;
452eaedb033SPeter Brune   PetscInt       i;
453eaedb033SPeter Brune   PetscErrorCode ierr;
454111ade9eSPeter Brune   Vec            Xlloc,Xl,Bl,Yl;
455111ade9eSPeter Brune   VecScatter     iscat,oscat,gscat;
456111ade9eSPeter Brune   DM             dm,subdm;
4570adebc6cSBarry Smith 
458eaedb033SPeter Brune   PetscFunctionBegin;
459eaedb033SPeter Brune   ierr = SNESGetDM(snes,&dm);CHKERRQ(ierr);
460111ade9eSPeter Brune   ierr = VecSet(Y,0);CHKERRQ(ierr);
461b20c023fSPeter Brune 
462b20c023fSPeter Brune   if (nasm->eventrestrictinterp) {ierr = PetscLogEventBegin(nasm->eventrestrictinterp,snes,0,0,0);CHKERRQ(ierr);}
463eaedb033SPeter Brune   for (i=0; i<nasm->n; i++) {
46470c78f05SPeter Brune     /* scatter the solution to the local solution */
46570c78f05SPeter Brune     Xlloc = nasm->xl[i];
46670c78f05SPeter Brune     gscat   = nasm->gscatter[i];
46770c78f05SPeter Brune     oscat   = nasm->oscatter[i];
46870c78f05SPeter Brune     ierr = VecScatterBegin(gscat,X,Xlloc,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
46970c78f05SPeter Brune     if (B) {
47070c78f05SPeter Brune       /* scatter the RHS to the local RHS */
47170c78f05SPeter Brune       Bl   = nasm->b[i];
47270c78f05SPeter Brune       ierr = VecScatterBegin(oscat,B,Bl,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
47370c78f05SPeter Brune     }
47470c78f05SPeter Brune   }
475b20c023fSPeter Brune   if (nasm->eventrestrictinterp) {ierr = PetscLogEventEnd(nasm->eventrestrictinterp,snes,0,0,0);CHKERRQ(ierr);}
476b20c023fSPeter Brune 
47770c78f05SPeter Brune   for (i=0; i<nasm->n; i++) {
47870c78f05SPeter Brune     Xlloc = nasm->xl[i];
479d590fa63SPeter Brune     gscat   = nasm->gscatter[i];
480d590fa63SPeter Brune     oscat   = nasm->oscatter[i];
48170c78f05SPeter Brune     ierr = VecScatterEnd(gscat,X,Xlloc,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
48270c78f05SPeter Brune     if (B) {
48324b7f281SPeter Brune       Bl   = nasm->b[i];
48470c78f05SPeter Brune       ierr = VecScatterEnd(oscat,B,Bl,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
48570c78f05SPeter Brune     }
48670c78f05SPeter Brune   }
487b20c023fSPeter Brune 
488b20c023fSPeter Brune   if (nasm->eventsubsolve) {ierr = PetscLogEventBegin(nasm->eventsubsolve,snes,0,0,0);CHKERRQ(ierr);}
48970c78f05SPeter Brune   for (i=0; i<nasm->n; i++) {
49070c78f05SPeter Brune     Xl    = nasm->x[i];
49170c78f05SPeter Brune     Xlloc = nasm->xl[i];
49270c78f05SPeter Brune     Yl    = nasm->y[i];
493258e1594SPeter Brune     subsnes = nasm->subsnes[i];
494258e1594SPeter Brune     ierr    = SNESGetDM(subsnes,&subdm);CHKERRQ(ierr);
495111ade9eSPeter Brune     iscat   = nasm->iscatter[i];
496111ade9eSPeter Brune     oscat   = nasm->oscatter[i];
497111ade9eSPeter Brune     gscat   = nasm->gscatter[i];
498111ade9eSPeter Brune     ierr    = DMSubDomainRestrict(dm,oscat,gscat,subdm);CHKERRQ(ierr);
49924b7f281SPeter Brune     if (B) {
50024b7f281SPeter Brune       Bl = nasm->b[i];
50124b7f281SPeter Brune     } else {
50224b7f281SPeter Brune       Bl = NULL;
50324b7f281SPeter Brune     }
50470c78f05SPeter Brune     ierr = DMLocalToGlobalBegin(subdm,Xlloc,INSERT_VALUES,Xl);CHKERRQ(ierr);
50570c78f05SPeter Brune     ierr = DMLocalToGlobalEnd(subdm,Xlloc,INSERT_VALUES,Xl);CHKERRQ(ierr);
506111ade9eSPeter Brune     ierr = VecCopy(Xl,Yl);CHKERRQ(ierr);
507258e1594SPeter Brune     ierr = SNESSolve(subsnes,Bl,Yl);CHKERRQ(ierr);
508111ade9eSPeter Brune     ierr = VecAXPY(Yl,-1.0,Xl);CHKERRQ(ierr);
50970c78f05SPeter Brune   }
510b20c023fSPeter Brune   if (nasm->eventsubsolve) {ierr = PetscLogEventEnd(nasm->eventsubsolve,snes,0,0,0);CHKERRQ(ierr);}
511111ade9eSPeter Brune 
512ce94432eSBarry Smith   ierr = MPI_Barrier(PetscObjectComm((PetscObject)snes));CHKERRQ(ierr);
51370c78f05SPeter Brune 
514b20c023fSPeter Brune   if (nasm->eventrestrictinterp) {ierr = PetscLogEventBegin(nasm->eventrestrictinterp,snes,0,0,0);CHKERRQ(ierr);}
51570c78f05SPeter Brune   for (i=0; i<nasm->n; i++) {
51670c78f05SPeter Brune     Yl    = nasm->y[i];
51770c78f05SPeter Brune     iscat   = nasm->iscatter[i];
51870c78f05SPeter Brune     oscat   = nasm->oscatter[i];
519111ade9eSPeter Brune     if (nasm->type == PC_ASM_BASIC) {
520111ade9eSPeter Brune       ierr = VecScatterBegin(oscat,Yl,Y,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
521111ade9eSPeter Brune     } else if (nasm->type == PC_ASM_RESTRICT) {
522111ade9eSPeter Brune       ierr = VecScatterBegin(iscat,Yl,Y,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
523ce94432eSBarry Smith     } else SETERRQ(PetscObjectComm((PetscObject)snes),PETSC_ERR_ARG_WRONGSTATE,"Only basic and restrict types are supported for SNESNASM");
524eaedb033SPeter Brune   }
525eaedb033SPeter Brune 
52670c78f05SPeter Brune   for (i=0; i<nasm->n; i++) {
52770c78f05SPeter Brune     Yl    = nasm->y[i];
52870c78f05SPeter Brune     iscat   = nasm->iscatter[i];
52970c78f05SPeter Brune     oscat   = nasm->oscatter[i];
53070c78f05SPeter Brune     if (nasm->type == PC_ASM_BASIC) {
53170c78f05SPeter Brune       ierr = VecScatterEnd(oscat,Yl,Y,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
53270c78f05SPeter Brune     } else if (nasm->type == PC_ASM_RESTRICT) {
53370c78f05SPeter Brune       ierr = VecScatterEnd(iscat,Yl,Y,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
534ce94432eSBarry Smith     } else SETERRQ(PetscObjectComm((PetscObject)snes),PETSC_ERR_ARG_WRONGSTATE,"Only basic and restrict types are supported for SNESNASM");
53570c78f05SPeter Brune   }
536b20c023fSPeter Brune   if (nasm->eventrestrictinterp) {ierr = PetscLogEventEnd(nasm->eventrestrictinterp,snes,0,0,0);CHKERRQ(ierr);}
53770c78f05SPeter Brune 
538ce94432eSBarry Smith   ierr = MPI_Barrier(PetscObjectComm((PetscObject)snes));CHKERRQ(ierr);
539cd939e56SPeter Brune 
540111ade9eSPeter Brune   ierr = VecAXPY(X,1.0,Y);CHKERRQ(ierr);
541eaedb033SPeter Brune   PetscFunctionReturn(0);
542eaedb033SPeter Brune }
543eaedb033SPeter Brune 
544eaedb033SPeter Brune #undef __FUNCT__
545*d728fb7dSPeter Brune #define __FUNCT__ "SNESNASMComputeFinalJacobian_Private"
546*d728fb7dSPeter Brune PetscErrorCode SNESNASMComputeFinalJacobian_Private(SNES snes, Vec X)
547*d728fb7dSPeter Brune {
548*d728fb7dSPeter Brune   SNES_NASM      *nasm = (SNES_NASM*)snes->data;
549*d728fb7dSPeter Brune   SNES           subsnes;
550*d728fb7dSPeter Brune   PetscInt       i;
551*d728fb7dSPeter Brune   PetscErrorCode ierr;
552*d728fb7dSPeter Brune   Vec            Xlloc,Xl;
553*d728fb7dSPeter Brune   VecScatter     oscat,gscat;
554*d728fb7dSPeter Brune   DM             dm,subdm;
555*d728fb7dSPeter Brune   MatStructure   flg = DIFFERENT_NONZERO_PATTERN;
556*d728fb7dSPeter Brune 
557*d728fb7dSPeter Brune   PetscFunctionBegin;
558*d728fb7dSPeter Brune   ierr = SNESComputeJacobian(snes,X,&snes->jacobian,&snes->jacobian_pre,&flg);CHKERRQ(ierr);
559*d728fb7dSPeter Brune   ierr = SNESGetDM(snes,&dm);CHKERRQ(ierr);
560*d728fb7dSPeter Brune   if (nasm->eventrestrictinterp) {ierr = PetscLogEventBegin(nasm->eventrestrictinterp,snes,0,0,0);CHKERRQ(ierr);}
561*d728fb7dSPeter Brune   for (i=0; i<nasm->n; i++) {
562*d728fb7dSPeter Brune     /* scatter the solution to the local solution */
563*d728fb7dSPeter Brune     Xlloc = nasm->xl[i];
564*d728fb7dSPeter Brune     gscat   = nasm->gscatter[i];
565*d728fb7dSPeter Brune     oscat   = nasm->oscatter[i];
566*d728fb7dSPeter Brune     ierr = VecScatterBegin(gscat,X,Xlloc,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
567*d728fb7dSPeter Brune   }
568*d728fb7dSPeter Brune   if (nasm->eventrestrictinterp) {ierr = PetscLogEventEnd(nasm->eventrestrictinterp,snes,0,0,0);CHKERRQ(ierr);}
569*d728fb7dSPeter Brune 
570*d728fb7dSPeter Brune   for (i=0; i<nasm->n; i++) {
571*d728fb7dSPeter Brune     Xlloc = nasm->xl[i];
572*d728fb7dSPeter Brune     gscat   = nasm->gscatter[i];
573*d728fb7dSPeter Brune     oscat   = nasm->oscatter[i];
574*d728fb7dSPeter Brune     ierr = VecScatterEnd(gscat,X,Xlloc,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
575*d728fb7dSPeter Brune   }
576*d728fb7dSPeter Brune 
577*d728fb7dSPeter Brune   for (i=0; i<nasm->n; i++) {
578*d728fb7dSPeter Brune     Xl    = nasm->x[i];
579*d728fb7dSPeter Brune     Xlloc = nasm->xl[i];
580*d728fb7dSPeter Brune     subsnes = nasm->subsnes[i];
581*d728fb7dSPeter Brune     ierr    = SNESGetDM(subsnes,&subdm);CHKERRQ(ierr);
582*d728fb7dSPeter Brune     oscat   = nasm->oscatter[i];
583*d728fb7dSPeter Brune     gscat   = nasm->gscatter[i];
584*d728fb7dSPeter Brune     ierr    = DMSubDomainRestrict(dm,oscat,gscat,subdm);CHKERRQ(ierr);
585*d728fb7dSPeter Brune     ierr = DMLocalToGlobalBegin(subdm,Xlloc,INSERT_VALUES,Xl);CHKERRQ(ierr);
586*d728fb7dSPeter Brune     ierr = DMLocalToGlobalEnd(subdm,Xlloc,INSERT_VALUES,Xl);CHKERRQ(ierr);
587*d728fb7dSPeter Brune     ierr = SNESComputeJacobian(subsnes,Xl,&snes->jacobian,&subsnes->jacobian_pre,&flg);CHKERRQ(ierr);
588*d728fb7dSPeter Brune     ierr = KSPSetOperators(subsnes->ksp,subsnes->jacobian,subsnes->jacobian_pre,flg);CHKERRQ(ierr);
589*d728fb7dSPeter Brune   }
590*d728fb7dSPeter Brune 
591*d728fb7dSPeter Brune   ierr = MPI_Barrier(PetscObjectComm((PetscObject)snes));CHKERRQ(ierr);
592*d728fb7dSPeter Brune   PetscFunctionReturn(0);
593*d728fb7dSPeter Brune }
594*d728fb7dSPeter Brune 
595*d728fb7dSPeter Brune #undef __FUNCT__
596eaedb033SPeter Brune #define __FUNCT__ "SNESSolve_NASM"
597eaedb033SPeter Brune PetscErrorCode SNESSolve_NASM(SNES snes)
598eaedb033SPeter Brune {
599eaedb033SPeter Brune   Vec            F;
600eaedb033SPeter Brune   Vec            X;
601eaedb033SPeter Brune   Vec            B;
602111ade9eSPeter Brune   Vec            Y;
603eaedb033SPeter Brune   PetscInt       i;
604eaedb033SPeter Brune   PetscReal      fnorm;
605eaedb033SPeter Brune   PetscErrorCode ierr;
606eaedb033SPeter Brune   SNESNormType   normtype;
607*d728fb7dSPeter Brune   SNES_NASM      *nasm = (SNES_NASM*)snes->data;
608eaedb033SPeter Brune 
609eaedb033SPeter Brune   PetscFunctionBegin;
610eaedb033SPeter Brune   X = snes->vec_sol;
611111ade9eSPeter Brune   Y = snes->vec_sol_update;
612eaedb033SPeter Brune   F = snes->vec_func;
613eaedb033SPeter Brune   B = snes->vec_rhs;
614eaedb033SPeter Brune 
615eaedb033SPeter Brune   ierr         = PetscObjectTakeAccess(snes);CHKERRQ(ierr);
616eaedb033SPeter Brune   snes->iter   = 0;
617eaedb033SPeter Brune   snes->norm   = 0.;
618eaedb033SPeter Brune   ierr         = PetscObjectGrantAccess(snes);CHKERRQ(ierr);
619eaedb033SPeter Brune   snes->reason = SNES_CONVERGED_ITERATING;
620eaedb033SPeter Brune   ierr         = SNESGetNormType(snes, &normtype);CHKERRQ(ierr);
621eaedb033SPeter Brune   if (normtype == SNES_NORM_FUNCTION || normtype == SNES_NORM_INITIAL_ONLY || normtype == SNES_NORM_INITIAL_FINAL_ONLY) {
622eaedb033SPeter Brune     /* compute the initial function and preconditioned update delX */
623eaedb033SPeter Brune     if (!snes->vec_func_init_set) {
624eaedb033SPeter Brune       ierr = SNESComputeFunction(snes,X,F);CHKERRQ(ierr);
625eaedb033SPeter Brune       if (snes->domainerror) {
626eaedb033SPeter Brune         snes->reason = SNES_DIVERGED_FUNCTION_DOMAIN;
627eaedb033SPeter Brune         PetscFunctionReturn(0);
628eaedb033SPeter Brune       }
6291aa26658SKarl Rupp     } else snes->vec_func_init_set = PETSC_FALSE;
630eaedb033SPeter Brune 
631eaedb033SPeter Brune     /* convergence test */
632eaedb033SPeter Brune     if (!snes->norm_init_set) {
633eaedb033SPeter Brune       ierr = VecNorm(F, NORM_2, &fnorm);CHKERRQ(ierr); /* fnorm <- ||F||  */
634eaedb033SPeter Brune       if (PetscIsInfOrNanReal(fnorm)) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_FP,"Infinite or not-a-number generated in norm");
635eaedb033SPeter Brune     } else {
636eaedb033SPeter Brune       fnorm               = snes->norm_init;
637eaedb033SPeter Brune       snes->norm_init_set = PETSC_FALSE;
638eaedb033SPeter Brune     }
639eaedb033SPeter Brune     ierr       = PetscObjectTakeAccess(snes);CHKERRQ(ierr);
640eaedb033SPeter Brune     snes->iter = 0;
641eaedb033SPeter Brune     snes->norm = fnorm;
642eaedb033SPeter Brune     ierr       = PetscObjectGrantAccess(snes);CHKERRQ(ierr);
643a71f0d7dSBarry Smith     ierr       = SNESLogConvergenceHistory(snes,snes->norm,0);CHKERRQ(ierr);
644eaedb033SPeter Brune     ierr       = SNESMonitor(snes,0,snes->norm);CHKERRQ(ierr);
645eaedb033SPeter Brune 
646eaedb033SPeter Brune     /* set parameter for default relative tolerance convergence test */
647eaedb033SPeter Brune     snes->ttol = fnorm*snes->rtol;
648eaedb033SPeter Brune 
649eaedb033SPeter Brune     /* test convergence */
650eaedb033SPeter Brune     ierr = (*snes->ops->converged)(snes,0,0.0,0.0,fnorm,&snes->reason,snes->cnvP);CHKERRQ(ierr);
651eaedb033SPeter Brune     if (snes->reason) PetscFunctionReturn(0);
652eaedb033SPeter Brune   } else {
653eaedb033SPeter Brune     ierr = PetscObjectGrantAccess(snes);CHKERRQ(ierr);
654a71f0d7dSBarry Smith     ierr = SNESLogConvergenceHistory(snes,snes->norm,0);CHKERRQ(ierr);
655eaedb033SPeter Brune     ierr = SNESMonitor(snes,0,snes->norm);CHKERRQ(ierr);
656eaedb033SPeter Brune   }
657eaedb033SPeter Brune 
658eaedb033SPeter Brune   /* Call general purpose update function */
659eaedb033SPeter Brune   if (snes->ops->update) {
660eaedb033SPeter Brune     ierr = (*snes->ops->update)(snes, snes->iter);CHKERRQ(ierr);
661eaedb033SPeter Brune   }
662eaedb033SPeter Brune 
663eaedb033SPeter Brune   for (i = 0; i < snes->max_its; i++) {
664111ade9eSPeter Brune     ierr = SNESNASMSolveLocal_Private(snes,B,Y,X);CHKERRQ(ierr);
665eaedb033SPeter Brune     if (normtype == SNES_NORM_FUNCTION || ((i == snes->max_its - 1) && (normtype == SNES_NORM_INITIAL_FINAL_ONLY || normtype == SNES_NORM_FINAL_ONLY))) {
666eaedb033SPeter Brune       ierr = SNESComputeFunction(snes,X,F);CHKERRQ(ierr);
667eaedb033SPeter Brune       if (snes->domainerror) {
668eaedb033SPeter Brune         snes->reason = SNES_DIVERGED_FUNCTION_DOMAIN;
669*d728fb7dSPeter Brune         break;
670eaedb033SPeter Brune       }
671eaedb033SPeter Brune       ierr = VecNorm(F, NORM_2, &fnorm);CHKERRQ(ierr); /* fnorm <- ||F||  */
672eaedb033SPeter Brune       if (PetscIsInfOrNanReal(fnorm)) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_FP,"Infinite or not-a-number generated in norm");
673eaedb033SPeter Brune     }
674eaedb033SPeter Brune     /* Monitor convergence */
675eaedb033SPeter Brune     ierr       = PetscObjectTakeAccess(snes);CHKERRQ(ierr);
676eaedb033SPeter Brune     snes->iter = i+1;
677eaedb033SPeter Brune     snes->norm = fnorm;
678eaedb033SPeter Brune     ierr       = PetscObjectGrantAccess(snes);CHKERRQ(ierr);
679a71f0d7dSBarry Smith     ierr       = SNESLogConvergenceHistory(snes,snes->norm,0);CHKERRQ(ierr);
680eaedb033SPeter Brune     ierr       = SNESMonitor(snes,snes->iter,snes->norm);CHKERRQ(ierr);
681eaedb033SPeter Brune     /* Test for convergence */
682eaedb033SPeter Brune     if (normtype == SNES_NORM_FUNCTION) ierr = (*snes->ops->converged)(snes,snes->iter,0.0,0.0,fnorm,&snes->reason,snes->cnvP);CHKERRQ(ierr);
683*d728fb7dSPeter Brune     if (snes->reason) break;
684eaedb033SPeter Brune     /* Call general purpose update function */
685eaedb033SPeter Brune     if (snes->ops->update) {
686eaedb033SPeter Brune       ierr = (*snes->ops->update)(snes, snes->iter);CHKERRQ(ierr);
687eaedb033SPeter Brune     }
688eaedb033SPeter Brune   }
689*d728fb7dSPeter Brune   if (nasm->finaljacobian) {ierr = SNESNASMComputeFinalJacobian_Private(snes,X);CHKERRQ(ierr);}
690eaedb033SPeter Brune   if (normtype == SNES_NORM_FUNCTION) {
691eaedb033SPeter Brune     if (i == snes->max_its) {
692eaedb033SPeter Brune       ierr = PetscInfo1(snes,"Maximum number of iterations has been reached: %D\n",snes->max_its);CHKERRQ(ierr);
693eaedb033SPeter Brune       if (!snes->reason) snes->reason = SNES_DIVERGED_MAX_IT;
694eaedb033SPeter Brune     }
6951aa26658SKarl Rupp   } else if (!snes->reason) snes->reason = SNES_CONVERGED_ITS; /* NASM is meant to be used as a preconditioner */
696eaedb033SPeter Brune   PetscFunctionReturn(0);
697eaedb033SPeter Brune }
698eaedb033SPeter Brune 
/*MC
  SNESNASM - Nonlinear Additive Schwarz

   Level: advanced

.seealso: SNESCreate(), SNES, SNESSetType(), SNESType (for list of available types)
M*/
706eaedb033SPeter Brune 
707eaedb033SPeter Brune EXTERN_C_BEGIN
708eaedb033SPeter Brune #undef __FUNCT__
709eaedb033SPeter Brune #define __FUNCT__ "SNESCreate_NASM"
710eaedb033SPeter Brune PetscErrorCode SNESCreate_NASM(SNES snes)
711eaedb033SPeter Brune {
712eaedb033SPeter Brune   SNES_NASM      *nasm;
713eaedb033SPeter Brune   PetscErrorCode ierr;
714eaedb033SPeter Brune 
715eaedb033SPeter Brune   PetscFunctionBegin;
716eaedb033SPeter Brune   ierr       = PetscNewLog(snes, SNES_NASM, &nasm);CHKERRQ(ierr);
717eaedb033SPeter Brune   snes->data = (void*)nasm;
718eaedb033SPeter Brune 
719eaedb033SPeter Brune   nasm->n        = PETSC_DECIDE;
720eaedb033SPeter Brune   nasm->subsnes  = 0;
721eaedb033SPeter Brune   nasm->x        = 0;
722111ade9eSPeter Brune   nasm->xl       = 0;
723111ade9eSPeter Brune   nasm->y        = 0;
724eaedb033SPeter Brune   nasm->b        = 0;
725111ade9eSPeter Brune   nasm->oscatter = 0;
726111ade9eSPeter Brune   nasm->iscatter = 0;
727111ade9eSPeter Brune   nasm->gscatter = 0;
728111ade9eSPeter Brune 
729111ade9eSPeter Brune   nasm->type = PC_ASM_BASIC;
730*d728fb7dSPeter Brune   nasm->finaljacobian = PETSC_FALSE;
731eaedb033SPeter Brune 
732eaedb033SPeter Brune   snes->ops->destroy        = SNESDestroy_NASM;
733eaedb033SPeter Brune   snes->ops->setup          = SNESSetUp_NASM;
734eaedb033SPeter Brune   snes->ops->setfromoptions = SNESSetFromOptions_NASM;
735eaedb033SPeter Brune   snes->ops->view           = SNESView_NASM;
736eaedb033SPeter Brune   snes->ops->solve          = SNESSolve_NASM;
737eaedb033SPeter Brune   snes->ops->reset          = SNESReset_NASM;
738eaedb033SPeter Brune 
739eaedb033SPeter Brune   snes->usesksp = PETSC_FALSE;
740eaedb033SPeter Brune   snes->usespc  = PETSC_FALSE;
741eaedb033SPeter Brune 
7420298fd71SBarry Smith   nasm->eventrestrictinterp = 0;
7430298fd71SBarry Smith   nasm->eventsubsolve       = 0;
744b20c023fSPeter Brune 
745eaedb033SPeter Brune   if (!snes->tolerancesset) {
746eaedb033SPeter Brune     snes->max_its   = 10000;
747eaedb033SPeter Brune     snes->max_funcs = 10000;
748eaedb033SPeter Brune   }
749eaedb033SPeter Brune 
750eaedb033SPeter Brune   ierr = PetscObjectComposeFunctionDynamic((PetscObject)snes,"SNESNASMSetSubdomains_C","SNESNASMSetSubdomains_NASM",
751eaedb033SPeter Brune                                            SNESNASMSetSubdomains_NASM);CHKERRQ(ierr);
75276857b2aSPeter Brune   ierr = PetscObjectComposeFunctionDynamic((PetscObject)snes,"SNESNASMGetSubdomains_C","SNESNASMGetSubdomains_NASM",
75376857b2aSPeter Brune                                            SNESNASMGetSubdomains_NASM);CHKERRQ(ierr);
75476857b2aSPeter Brune   ierr = PetscObjectComposeFunctionDynamic((PetscObject)snes,"SNESNASMGetSubdomainVecs_C","SNESNASMGetSubdomainVecs_NASM",
75576857b2aSPeter Brune                                            SNESNASMGetSubdomainVecs_NASM);CHKERRQ(ierr);
756*d728fb7dSPeter Brune   ierr = PetscObjectComposeFunctionDynamic((PetscObject)snes,"SNESNASMSetComputeFinalJacobian_C","SNESNASMSetComputeFinalJacobian_NASM",
757*d728fb7dSPeter Brune                                            SNESNASMSetComputeFinalJacobian_NASM);CHKERRQ(ierr);
758eaedb033SPeter Brune   PetscFunctionReturn(0);
759eaedb033SPeter Brune }
760eaedb033SPeter Brune EXTERN_C_END
761