xref: /petsc/src/dm/impls/plex/plexfem.c (revision 40e14135f9d92c5492101d3e2d19fc90af32d9f7)
1cb1e1211SMatthew G Knepley #include <petsc-private/dmpleximpl.h>   /*I      "petscdmplex.h"   I*/
2cb1e1211SMatthew G Knepley 
3a0845e3aSMatthew G. Knepley #include <petscfe.h>
4a0845e3aSMatthew G. Knepley 
5cb1e1211SMatthew G Knepley #undef __FUNCT__
6cb1e1211SMatthew G Knepley #define __FUNCT__ "DMPlexGetScale"
7cb1e1211SMatthew G Knepley PetscErrorCode DMPlexGetScale(DM dm, PetscUnit unit, PetscReal *scale)
8cb1e1211SMatthew G Knepley {
9cb1e1211SMatthew G Knepley   DM_Plex *mesh = (DM_Plex*) dm->data;
10cb1e1211SMatthew G Knepley 
11cb1e1211SMatthew G Knepley   PetscFunctionBegin;
12cb1e1211SMatthew G Knepley   PetscValidHeaderSpecific(dm, DM_CLASSID, 1);
13cb1e1211SMatthew G Knepley   PetscValidPointer(scale, 3);
14cb1e1211SMatthew G Knepley   *scale = mesh->scale[unit];
15cb1e1211SMatthew G Knepley   PetscFunctionReturn(0);
16cb1e1211SMatthew G Knepley }
17cb1e1211SMatthew G Knepley 
18cb1e1211SMatthew G Knepley #undef __FUNCT__
19cb1e1211SMatthew G Knepley #define __FUNCT__ "DMPlexSetScale"
20cb1e1211SMatthew G Knepley PetscErrorCode DMPlexSetScale(DM dm, PetscUnit unit, PetscReal scale)
21cb1e1211SMatthew G Knepley {
22cb1e1211SMatthew G Knepley   DM_Plex *mesh = (DM_Plex*) dm->data;
23cb1e1211SMatthew G Knepley 
24cb1e1211SMatthew G Knepley   PetscFunctionBegin;
25cb1e1211SMatthew G Knepley   PetscValidHeaderSpecific(dm, DM_CLASSID, 1);
26cb1e1211SMatthew G Knepley   mesh->scale[unit] = scale;
27cb1e1211SMatthew G Knepley   PetscFunctionReturn(0);
28cb1e1211SMatthew G Knepley }
29cb1e1211SMatthew G Knepley 
30cb1e1211SMatthew G Knepley PETSC_STATIC_INLINE PetscInt epsilon(PetscInt i, PetscInt j, PetscInt k)
31cb1e1211SMatthew G Knepley {
32cb1e1211SMatthew G Knepley   switch (i) {
33cb1e1211SMatthew G Knepley   case 0:
34cb1e1211SMatthew G Knepley     switch (j) {
35cb1e1211SMatthew G Knepley     case 0: return 0;
36cb1e1211SMatthew G Knepley     case 1:
37cb1e1211SMatthew G Knepley       switch (k) {
38cb1e1211SMatthew G Knepley       case 0: return 0;
39cb1e1211SMatthew G Knepley       case 1: return 0;
40cb1e1211SMatthew G Knepley       case 2: return 1;
41cb1e1211SMatthew G Knepley       }
42cb1e1211SMatthew G Knepley     case 2:
43cb1e1211SMatthew G Knepley       switch (k) {
44cb1e1211SMatthew G Knepley       case 0: return 0;
45cb1e1211SMatthew G Knepley       case 1: return -1;
46cb1e1211SMatthew G Knepley       case 2: return 0;
47cb1e1211SMatthew G Knepley       }
48cb1e1211SMatthew G Knepley     }
49cb1e1211SMatthew G Knepley   case 1:
50cb1e1211SMatthew G Knepley     switch (j) {
51cb1e1211SMatthew G Knepley     case 0:
52cb1e1211SMatthew G Knepley       switch (k) {
53cb1e1211SMatthew G Knepley       case 0: return 0;
54cb1e1211SMatthew G Knepley       case 1: return 0;
55cb1e1211SMatthew G Knepley       case 2: return -1;
56cb1e1211SMatthew G Knepley       }
57cb1e1211SMatthew G Knepley     case 1: return 0;
58cb1e1211SMatthew G Knepley     case 2:
59cb1e1211SMatthew G Knepley       switch (k) {
60cb1e1211SMatthew G Knepley       case 0: return 1;
61cb1e1211SMatthew G Knepley       case 1: return 0;
62cb1e1211SMatthew G Knepley       case 2: return 0;
63cb1e1211SMatthew G Knepley       }
64cb1e1211SMatthew G Knepley     }
65cb1e1211SMatthew G Knepley   case 2:
66cb1e1211SMatthew G Knepley     switch (j) {
67cb1e1211SMatthew G Knepley     case 0:
68cb1e1211SMatthew G Knepley       switch (k) {
69cb1e1211SMatthew G Knepley       case 0: return 0;
70cb1e1211SMatthew G Knepley       case 1: return 1;
71cb1e1211SMatthew G Knepley       case 2: return 0;
72cb1e1211SMatthew G Knepley       }
73cb1e1211SMatthew G Knepley     case 1:
74cb1e1211SMatthew G Knepley       switch (k) {
75cb1e1211SMatthew G Knepley       case 0: return -1;
76cb1e1211SMatthew G Knepley       case 1: return 0;
77cb1e1211SMatthew G Knepley       case 2: return 0;
78cb1e1211SMatthew G Knepley       }
79cb1e1211SMatthew G Knepley     case 2: return 0;
80cb1e1211SMatthew G Knepley     }
81cb1e1211SMatthew G Knepley   }
82cb1e1211SMatthew G Knepley   return 0;
83cb1e1211SMatthew G Knepley }
84cb1e1211SMatthew G Knepley 
85cb1e1211SMatthew G Knepley #undef __FUNCT__
86cb1e1211SMatthew G Knepley #define __FUNCT__ "DMPlexCreateRigidBody"
87cb1e1211SMatthew G Knepley /*@C
88cb1e1211SMatthew G Knepley   DMPlexCreateRigidBody - create rigid body modes from coordinates
89cb1e1211SMatthew G Knepley 
90cb1e1211SMatthew G Knepley   Collective on DM
91cb1e1211SMatthew G Knepley 
92cb1e1211SMatthew G Knepley   Input Arguments:
93cb1e1211SMatthew G Knepley + dm - the DM
94cb1e1211SMatthew G Knepley . section - the local section associated with the rigid field, or NULL for the default section
95cb1e1211SMatthew G Knepley - globalSection - the global section associated with the rigid field, or NULL for the default section
96cb1e1211SMatthew G Knepley 
97cb1e1211SMatthew G Knepley   Output Argument:
98cb1e1211SMatthew G Knepley . sp - the null space
99cb1e1211SMatthew G Knepley 
100cb1e1211SMatthew G Knepley   Note: This is necessary to take account of Dirichlet conditions on the displacements
101cb1e1211SMatthew G Knepley 
102cb1e1211SMatthew G Knepley   Level: advanced
103cb1e1211SMatthew G Knepley 
104cb1e1211SMatthew G Knepley .seealso: MatNullSpaceCreate()
105cb1e1211SMatthew G Knepley @*/
106cb1e1211SMatthew G Knepley PetscErrorCode DMPlexCreateRigidBody(DM dm, PetscSection section, PetscSection globalSection, MatNullSpace *sp)
107cb1e1211SMatthew G Knepley {
108cb1e1211SMatthew G Knepley   MPI_Comm       comm;
109cb1e1211SMatthew G Knepley   Vec            coordinates, localMode, mode[6];
110cb1e1211SMatthew G Knepley   PetscSection   coordSection;
111cb1e1211SMatthew G Knepley   PetscScalar   *coords;
112cb1e1211SMatthew G Knepley   PetscInt       dim, vStart, vEnd, v, n, m, d, i, j;
113cb1e1211SMatthew G Knepley   PetscErrorCode ierr;
114cb1e1211SMatthew G Knepley 
115cb1e1211SMatthew G Knepley   PetscFunctionBegin;
116cb1e1211SMatthew G Knepley   ierr = PetscObjectGetComm((PetscObject)dm,&comm);CHKERRQ(ierr);
117cb1e1211SMatthew G Knepley   ierr = DMPlexGetDimension(dm, &dim);CHKERRQ(ierr);
118cb1e1211SMatthew G Knepley   if (dim == 1) {
119cb1e1211SMatthew G Knepley     ierr = MatNullSpaceCreate(comm, PETSC_TRUE, 0, NULL, sp);CHKERRQ(ierr);
120cb1e1211SMatthew G Knepley     PetscFunctionReturn(0);
121cb1e1211SMatthew G Knepley   }
122cb1e1211SMatthew G Knepley   if (!section)       {ierr = DMGetDefaultSection(dm, &section);CHKERRQ(ierr);}
123cb1e1211SMatthew G Knepley   if (!globalSection) {ierr = DMGetDefaultGlobalSection(dm, &globalSection);CHKERRQ(ierr);}
124cb1e1211SMatthew G Knepley   ierr = PetscSectionGetConstrainedStorageSize(globalSection, &n);CHKERRQ(ierr);
125cb1e1211SMatthew G Knepley   ierr = DMPlexGetDepthStratum(dm, 0, &vStart, &vEnd);CHKERRQ(ierr);
12669d8a9ceSMatthew G. Knepley   ierr = DMGetCoordinateSection(dm, &coordSection);CHKERRQ(ierr);
127cb1e1211SMatthew G Knepley   ierr = DMGetCoordinatesLocal(dm, &coordinates);CHKERRQ(ierr);
128cb1e1211SMatthew G Knepley   m    = (dim*(dim+1))/2;
129cb1e1211SMatthew G Knepley   ierr = VecCreate(comm, &mode[0]);CHKERRQ(ierr);
130cb1e1211SMatthew G Knepley   ierr = VecSetSizes(mode[0], n, PETSC_DETERMINE);CHKERRQ(ierr);
131cb1e1211SMatthew G Knepley   ierr = VecSetUp(mode[0]);CHKERRQ(ierr);
132cb1e1211SMatthew G Knepley   for (i = 1; i < m; ++i) {ierr = VecDuplicate(mode[0], &mode[i]);CHKERRQ(ierr);}
133cb1e1211SMatthew G Knepley   /* Assume P1 */
134cb1e1211SMatthew G Knepley   ierr = DMGetLocalVector(dm, &localMode);CHKERRQ(ierr);
135cb1e1211SMatthew G Knepley   for (d = 0; d < dim; ++d) {
136cb1e1211SMatthew G Knepley     PetscScalar values[3] = {0.0, 0.0, 0.0};
137cb1e1211SMatthew G Knepley 
138cb1e1211SMatthew G Knepley     values[d] = 1.0;
139cb1e1211SMatthew G Knepley     ierr      = VecSet(localMode, 0.0);CHKERRQ(ierr);
140cb1e1211SMatthew G Knepley     for (v = vStart; v < vEnd; ++v) {
141cb1e1211SMatthew G Knepley       ierr = DMPlexVecSetClosure(dm, section, localMode, v, values, INSERT_VALUES);CHKERRQ(ierr);
142cb1e1211SMatthew G Knepley     }
143cb1e1211SMatthew G Knepley     ierr = DMLocalToGlobalBegin(dm, localMode, INSERT_VALUES, mode[d]);CHKERRQ(ierr);
144cb1e1211SMatthew G Knepley     ierr = DMLocalToGlobalEnd(dm, localMode, INSERT_VALUES, mode[d]);CHKERRQ(ierr);
145cb1e1211SMatthew G Knepley   }
146cb1e1211SMatthew G Knepley   ierr = VecGetArray(coordinates, &coords);CHKERRQ(ierr);
147cb1e1211SMatthew G Knepley   for (d = dim; d < dim*(dim+1)/2; ++d) {
148cb1e1211SMatthew G Knepley     PetscInt i, j, k = dim > 2 ? d - dim : d;
149cb1e1211SMatthew G Knepley 
150cb1e1211SMatthew G Knepley     ierr = VecSet(localMode, 0.0);CHKERRQ(ierr);
151cb1e1211SMatthew G Knepley     for (v = vStart; v < vEnd; ++v) {
152cb1e1211SMatthew G Knepley       PetscScalar values[3] = {0.0, 0.0, 0.0};
153cb1e1211SMatthew G Knepley       PetscInt    off;
154cb1e1211SMatthew G Knepley 
155cb1e1211SMatthew G Knepley       ierr = PetscSectionGetOffset(coordSection, v, &off);CHKERRQ(ierr);
156cb1e1211SMatthew G Knepley       for (i = 0; i < dim; ++i) {
157cb1e1211SMatthew G Knepley         for (j = 0; j < dim; ++j) {
158cb1e1211SMatthew G Knepley           values[j] += epsilon(i, j, k)*PetscRealPart(coords[off+i]);
159cb1e1211SMatthew G Knepley         }
160cb1e1211SMatthew G Knepley       }
161cb1e1211SMatthew G Knepley       ierr = DMPlexVecSetClosure(dm, section, localMode, v, values, INSERT_VALUES);CHKERRQ(ierr);
162cb1e1211SMatthew G Knepley     }
163cb1e1211SMatthew G Knepley     ierr = DMLocalToGlobalBegin(dm, localMode, INSERT_VALUES, mode[d]);CHKERRQ(ierr);
164cb1e1211SMatthew G Knepley     ierr = DMLocalToGlobalEnd(dm, localMode, INSERT_VALUES, mode[d]);CHKERRQ(ierr);
165cb1e1211SMatthew G Knepley   }
166cb1e1211SMatthew G Knepley   ierr = VecRestoreArray(coordinates, &coords);CHKERRQ(ierr);
167cb1e1211SMatthew G Knepley   ierr = DMRestoreLocalVector(dm, &localMode);CHKERRQ(ierr);
168cb1e1211SMatthew G Knepley   for (i = 0; i < dim; ++i) {ierr = VecNormalize(mode[i], NULL);CHKERRQ(ierr);}
169cb1e1211SMatthew G Knepley   /* Orthonormalize system */
170cb1e1211SMatthew G Knepley   for (i = dim; i < m; ++i) {
171cb1e1211SMatthew G Knepley     PetscScalar dots[6];
172cb1e1211SMatthew G Knepley 
173cb1e1211SMatthew G Knepley     ierr = VecMDot(mode[i], i, mode, dots);CHKERRQ(ierr);
174cb1e1211SMatthew G Knepley     for (j = 0; j < i; ++j) dots[j] *= -1.0;
175cb1e1211SMatthew G Knepley     ierr = VecMAXPY(mode[i], i, dots, mode);CHKERRQ(ierr);
176cb1e1211SMatthew G Knepley     ierr = VecNormalize(mode[i], NULL);CHKERRQ(ierr);
177cb1e1211SMatthew G Knepley   }
178cb1e1211SMatthew G Knepley   ierr = MatNullSpaceCreate(comm, PETSC_FALSE, m, mode, sp);CHKERRQ(ierr);
179cb1e1211SMatthew G Knepley   for (i = 0; i< m; ++i) {ierr = VecDestroy(&mode[i]);CHKERRQ(ierr);}
180cb1e1211SMatthew G Knepley   PetscFunctionReturn(0);
181cb1e1211SMatthew G Knepley }
182cb1e1211SMatthew G Knepley 
183cb1e1211SMatthew G Knepley #undef __FUNCT__
184cb1e1211SMatthew G Knepley #define __FUNCT__ "DMPlexProjectFunctionLocal"
18572f94c41SMatthew G. Knepley PetscErrorCode DMPlexProjectFunctionLocal(DM dm, PetscFE fe[], void (**funcs)(const PetscReal [], PetscScalar *), InsertMode mode, Vec localX)
186cb1e1211SMatthew G Knepley {
18772f94c41SMatthew G. Knepley   PetscDualSpace *sp;
18872f94c41SMatthew G. Knepley   PetscSection    section;
18972f94c41SMatthew G. Knepley   PetscScalar    *values;
19072f94c41SMatthew G. Knepley   PetscReal      *v0, *J, detJ;
19172f94c41SMatthew G. Knepley   PetscInt        numFields, numComp, dim, spDim, totDim = 0, numValues, cStart, cEnd, c, f, d, v;
192cb1e1211SMatthew G Knepley   PetscErrorCode  ierr;
193cb1e1211SMatthew G Knepley 
194cb1e1211SMatthew G Knepley   PetscFunctionBegin;
195cb1e1211SMatthew G Knepley   ierr = DMGetDefaultSection(dm, &section);CHKERRQ(ierr);
19672f94c41SMatthew G. Knepley   ierr = PetscSectionGetNumFields(section, &numFields);CHKERRQ(ierr);
197785e854fSJed Brown   ierr = PetscMalloc1(numFields, &sp);CHKERRQ(ierr);
19872f94c41SMatthew G. Knepley   for (f = 0; f < numFields; ++f) {
19972f94c41SMatthew G. Knepley     ierr = PetscFEGetDualSpace(fe[f], &sp[f]);CHKERRQ(ierr);
20072f94c41SMatthew G. Knepley     ierr = PetscFEGetNumComponents(fe[f], &numComp);CHKERRQ(ierr);
20172f94c41SMatthew G. Knepley     ierr = PetscDualSpaceGetDimension(sp[f], &spDim);CHKERRQ(ierr);
20272f94c41SMatthew G. Knepley     totDim += spDim*numComp;
203cb1e1211SMatthew G Knepley   }
20472f94c41SMatthew G. Knepley   ierr = DMPlexGetDimension(dm, &dim);CHKERRQ(ierr);
20572f94c41SMatthew G. Knepley   ierr = DMPlexGetHeightStratum(dm, 0, &cStart, &cEnd);CHKERRQ(ierr);
20672f94c41SMatthew G. Knepley   ierr = DMPlexVecGetClosure(dm, section, localX, cStart, &numValues, NULL);CHKERRQ(ierr);
20772f94c41SMatthew G. Knepley   if (numValues != totDim) SETERRQ2(PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "The section cell closure size %d != dual space dimension %d", numValues, totDim);
20872f94c41SMatthew G. Knepley   ierr = DMGetWorkArray(dm, numValues, PETSC_SCALAR, &values);CHKERRQ(ierr);
209dcca6d9dSJed Brown   ierr = PetscMalloc2(dim,&v0,dim*dim,&J);CHKERRQ(ierr);
21072f94c41SMatthew G. Knepley   for (c = cStart; c < cEnd; ++c) {
21172f94c41SMatthew G. Knepley     PetscCellGeometry geom;
212cb1e1211SMatthew G Knepley 
213cb1e1211SMatthew G Knepley     ierr = DMPlexComputeCellGeometry(dm, c, v0, J, NULL, &detJ);CHKERRQ(ierr);
21472f94c41SMatthew G. Knepley     geom.v0   = v0;
21572f94c41SMatthew G. Knepley     geom.J    = J;
21672f94c41SMatthew G. Knepley     geom.detJ = &detJ;
21772f94c41SMatthew G. Knepley     for (f = 0, v = 0; f < numFields; ++f) {
21872f94c41SMatthew G. Knepley       ierr = PetscFEGetNumComponents(fe[f], &numComp);CHKERRQ(ierr);
21972f94c41SMatthew G. Knepley       ierr = PetscDualSpaceGetDimension(sp[f], &spDim);CHKERRQ(ierr);
22072f94c41SMatthew G. Knepley       for (d = 0; d < spDim; ++d) {
22172f94c41SMatthew G. Knepley         ierr = PetscDualSpaceApply(sp[f], d, geom, numComp, funcs[f], &values[v]);CHKERRQ(ierr);
22272f94c41SMatthew G. Knepley         v += numComp;
223cb1e1211SMatthew G Knepley       }
224cb1e1211SMatthew G Knepley     }
22572f94c41SMatthew G. Knepley     ierr = DMPlexVecSetClosure(dm, section, localX, c, values, mode);CHKERRQ(ierr);
226cb1e1211SMatthew G Knepley   }
22772f94c41SMatthew G. Knepley   ierr = DMRestoreWorkArray(dm, numValues, PETSC_SCALAR, &values);CHKERRQ(ierr);
2281f2da991SMatthew G. Knepley   ierr = PetscFree2(v0,J);CHKERRQ(ierr);
22972f94c41SMatthew G. Knepley   ierr = PetscFree(sp);CHKERRQ(ierr);
230cb1e1211SMatthew G Knepley   PetscFunctionReturn(0);
231cb1e1211SMatthew G Knepley }
232cb1e1211SMatthew G Knepley 
233cb1e1211SMatthew G Knepley #undef __FUNCT__
234cb1e1211SMatthew G Knepley #define __FUNCT__ "DMPlexProjectFunction"
235cb1e1211SMatthew G Knepley /*@C
236cb1e1211SMatthew G Knepley   DMPlexProjectFunction - This projects the given function into the function space provided.
237cb1e1211SMatthew G Knepley 
238cb1e1211SMatthew G Knepley   Input Parameters:
239cb1e1211SMatthew G Knepley + dm      - The DM
24072f94c41SMatthew G. Knepley . fe      - The PetscFE associated with the field
24172f94c41SMatthew G. Knepley . funcs   - The coordinate functions to evaluate, one per field
242cb1e1211SMatthew G Knepley - mode    - The insertion mode for values
243cb1e1211SMatthew G Knepley 
244cb1e1211SMatthew G Knepley   Output Parameter:
245cb1e1211SMatthew G Knepley . X - vector
246cb1e1211SMatthew G Knepley 
247cb1e1211SMatthew G Knepley   Level: developer
248cb1e1211SMatthew G Knepley 
249878cb397SSatish Balay .seealso: DMPlexComputeL2Diff()
250878cb397SSatish Balay @*/
25172f94c41SMatthew G. Knepley PetscErrorCode DMPlexProjectFunction(DM dm, PetscFE fe[], void (**funcs)(const PetscReal [], PetscScalar *), InsertMode mode, Vec X)
252cb1e1211SMatthew G Knepley {
253cb1e1211SMatthew G Knepley   Vec            localX;
254cb1e1211SMatthew G Knepley   PetscErrorCode ierr;
255cb1e1211SMatthew G Knepley 
256cb1e1211SMatthew G Knepley   PetscFunctionBegin;
2579a800dd8SMatthew G. Knepley   PetscValidHeaderSpecific(dm, DM_CLASSID, 1);
258cb1e1211SMatthew G Knepley   ierr = DMGetLocalVector(dm, &localX);CHKERRQ(ierr);
25972f94c41SMatthew G. Knepley   ierr = DMPlexProjectFunctionLocal(dm, fe, funcs, mode, localX);CHKERRQ(ierr);
260cb1e1211SMatthew G Knepley   ierr = DMLocalToGlobalBegin(dm, localX, mode, X);CHKERRQ(ierr);
261cb1e1211SMatthew G Knepley   ierr = DMLocalToGlobalEnd(dm, localX, mode, X);CHKERRQ(ierr);
262cb1e1211SMatthew G Knepley   ierr = DMRestoreLocalVector(dm, &localX);CHKERRQ(ierr);
263cb1e1211SMatthew G Knepley   PetscFunctionReturn(0);
264cb1e1211SMatthew G Knepley }
265cb1e1211SMatthew G Knepley 
266cb1e1211SMatthew G Knepley #undef __FUNCT__
267cb1e1211SMatthew G Knepley #define __FUNCT__ "DMPlexComputeL2Diff"
268cb1e1211SMatthew G Knepley /*@C
269cb1e1211SMatthew G Knepley   DMPlexComputeL2Diff - This function computes the L_2 difference between a function u and an FEM interpolant solution u_h.
270cb1e1211SMatthew G Knepley 
271cb1e1211SMatthew G Knepley   Input Parameters:
272cb1e1211SMatthew G Knepley + dm    - The DM
273c5bbbd5bSMatthew G. Knepley . fe    - The PetscFE object for each field
274cb1e1211SMatthew G Knepley . funcs - The functions to evaluate for each field component
275cb1e1211SMatthew G Knepley - X     - The coefficient vector u_h
276cb1e1211SMatthew G Knepley 
277cb1e1211SMatthew G Knepley   Output Parameter:
278cb1e1211SMatthew G Knepley . diff - The diff ||u - u_h||_2
279cb1e1211SMatthew G Knepley 
280cb1e1211SMatthew G Knepley   Level: developer
281cb1e1211SMatthew G Knepley 
282cb1e1211SMatthew G Knepley .seealso: DMPlexProjectFunction()
283878cb397SSatish Balay @*/
284c5bbbd5bSMatthew G. Knepley PetscErrorCode DMPlexComputeL2Diff(DM dm, PetscFE fe[], void (**funcs)(const PetscReal [], PetscScalar *), Vec X, PetscReal *diff)
285cb1e1211SMatthew G Knepley {
286cb1e1211SMatthew G Knepley   const PetscInt  debug = 0;
287cb1e1211SMatthew G Knepley   PetscSection    section;
288c5bbbd5bSMatthew G. Knepley   PetscQuadrature quad;
289cb1e1211SMatthew G Knepley   Vec             localX;
29072f94c41SMatthew G. Knepley   PetscScalar    *funcVal;
291cb1e1211SMatthew G Knepley   PetscReal      *coords, *v0, *J, *invJ, detJ;
292cb1e1211SMatthew G Knepley   PetscReal       localDiff = 0.0;
293cb1e1211SMatthew G Knepley   PetscInt        dim, numFields, numComponents = 0, cStart, cEnd, c, field, fieldOffset, comp;
294cb1e1211SMatthew G Knepley   PetscErrorCode  ierr;
295cb1e1211SMatthew G Knepley 
296cb1e1211SMatthew G Knepley   PetscFunctionBegin;
297cb1e1211SMatthew G Knepley   ierr = DMPlexGetDimension(dm, &dim);CHKERRQ(ierr);
298cb1e1211SMatthew G Knepley   ierr = DMGetDefaultSection(dm, &section);CHKERRQ(ierr);
299cb1e1211SMatthew G Knepley   ierr = PetscSectionGetNumFields(section, &numFields);CHKERRQ(ierr);
300cb1e1211SMatthew G Knepley   ierr = DMGetLocalVector(dm, &localX);CHKERRQ(ierr);
301cb1e1211SMatthew G Knepley   ierr = DMGlobalToLocalBegin(dm, X, INSERT_VALUES, localX);CHKERRQ(ierr);
302cb1e1211SMatthew G Knepley   ierr = DMGlobalToLocalEnd(dm, X, INSERT_VALUES, localX);CHKERRQ(ierr);
303cb1e1211SMatthew G Knepley   for (field = 0; field < numFields; ++field) {
304c5bbbd5bSMatthew G. Knepley     PetscInt Nc;
305c5bbbd5bSMatthew G. Knepley 
306c5bbbd5bSMatthew G. Knepley     ierr = PetscFEGetNumComponents(fe[field], &Nc);CHKERRQ(ierr);
307c5bbbd5bSMatthew G. Knepley     numComponents += Nc;
308cb1e1211SMatthew G Knepley   }
30972f94c41SMatthew G. Knepley   ierr = DMPlexProjectFunctionLocal(dm, fe, funcs, INSERT_BC_VALUES, localX);CHKERRQ(ierr);
310dcca6d9dSJed Brown   ierr = PetscMalloc5(numComponents,&funcVal,dim,&coords,dim,&v0,dim*dim,&J,dim*dim,&invJ);CHKERRQ(ierr);
311cb1e1211SMatthew G Knepley   ierr = DMPlexGetHeightStratum(dm, 0, &cStart, &cEnd);CHKERRQ(ierr);
312c5bbbd5bSMatthew G. Knepley   ierr = PetscFEGetQuadrature(fe[0], &quad);CHKERRQ(ierr);
313cb1e1211SMatthew G Knepley   for (c = cStart; c < cEnd; ++c) {
314a1e44745SMatthew G. Knepley     PetscScalar *x = NULL;
315cb1e1211SMatthew G Knepley     PetscReal    elemDiff = 0.0;
316cb1e1211SMatthew G Knepley 
317cb1e1211SMatthew G Knepley     ierr = DMPlexComputeCellGeometry(dm, c, v0, J, invJ, &detJ);CHKERRQ(ierr);
318cb1e1211SMatthew G Knepley     if (detJ <= 0.0) SETERRQ2(PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Invalid determinant %g for element %d", detJ, c);
319cb1e1211SMatthew G Knepley     ierr = DMPlexVecGetClosure(dm, NULL, localX, c, NULL, &x);CHKERRQ(ierr);
320cb1e1211SMatthew G Knepley 
321cb1e1211SMatthew G Knepley     for (field = 0, comp = 0, fieldOffset = 0; field < numFields; ++field) {
322f9fd7fdbSMatthew G. Knepley       const PetscInt   numQuadPoints = quad.numPoints;
323f9fd7fdbSMatthew G. Knepley       const PetscReal *quadPoints    = quad.points;
324f9fd7fdbSMatthew G. Knepley       const PetscReal *quadWeights   = quad.weights;
325c5bbbd5bSMatthew G. Knepley       PetscReal       *basis;
326c5bbbd5bSMatthew G. Knepley       PetscInt         numBasisFuncs, numBasisComps, q, d, e, fc, f;
327cb1e1211SMatthew G Knepley 
328c5bbbd5bSMatthew G. Knepley       ierr = PetscFEGetDimension(fe[field], &numBasisFuncs);CHKERRQ(ierr);
329c5bbbd5bSMatthew G. Knepley       ierr = PetscFEGetNumComponents(fe[field], &numBasisComps);CHKERRQ(ierr);
330c5bbbd5bSMatthew G. Knepley       ierr = PetscFEGetDefaultTabulation(fe[field], &basis, NULL, NULL);CHKERRQ(ierr);
331cb1e1211SMatthew G Knepley       if (debug) {
332cb1e1211SMatthew G Knepley         char title[1024];
333cb1e1211SMatthew G Knepley         ierr = PetscSNPrintf(title, 1023, "Solution for Field %d", field);CHKERRQ(ierr);
334cb1e1211SMatthew G Knepley         ierr = DMPrintCellVector(c, title, numBasisFuncs*numBasisComps, &x[fieldOffset]);CHKERRQ(ierr);
335cb1e1211SMatthew G Knepley       }
336cb1e1211SMatthew G Knepley       for (q = 0; q < numQuadPoints; ++q) {
337cb1e1211SMatthew G Knepley         for (d = 0; d < dim; d++) {
338cb1e1211SMatthew G Knepley           coords[d] = v0[d];
339cb1e1211SMatthew G Knepley           for (e = 0; e < dim; e++) {
340cb1e1211SMatthew G Knepley             coords[d] += J[d*dim+e]*(quadPoints[q*dim+e] + 1.0);
341cb1e1211SMatthew G Knepley           }
342cb1e1211SMatthew G Knepley         }
34372f94c41SMatthew G. Knepley         (*funcs[field])(coords, funcVal);
344cb1e1211SMatthew G Knepley         for (fc = 0; fc < numBasisComps; ++fc) {
345a1d24da5SMatthew G. Knepley           PetscScalar interpolant = 0.0;
346a1d24da5SMatthew G. Knepley 
347cb1e1211SMatthew G Knepley           for (f = 0; f < numBasisFuncs; ++f) {
348cb1e1211SMatthew G Knepley             const PetscInt fidx = f*numBasisComps+fc;
349a1d24da5SMatthew G. Knepley             interpolant += x[fieldOffset+fidx]*basis[q*numBasisFuncs*numBasisComps+fidx];
350cb1e1211SMatthew G Knepley           }
35172f94c41SMatthew G. Knepley           if (debug) {ierr = PetscPrintf(PETSC_COMM_SELF, "    elem %d field %d diff %g\n", c, field, PetscSqr(PetscRealPart(interpolant - funcVal[fc]))*quadWeights[q]*detJ);CHKERRQ(ierr);}
35272f94c41SMatthew G. Knepley           elemDiff += PetscSqr(PetscRealPart(interpolant - funcVal[fc]))*quadWeights[q]*detJ;
353cb1e1211SMatthew G Knepley         }
354cb1e1211SMatthew G Knepley       }
355cb1e1211SMatthew G Knepley       comp        += numBasisComps;
356cb1e1211SMatthew G Knepley       fieldOffset += numBasisFuncs*numBasisComps;
357cb1e1211SMatthew G Knepley     }
358cb1e1211SMatthew G Knepley     ierr = DMPlexVecRestoreClosure(dm, NULL, localX, c, NULL, &x);CHKERRQ(ierr);
359cb1e1211SMatthew G Knepley     if (debug) {ierr = PetscPrintf(PETSC_COMM_SELF, "  elem %d diff %g\n", c, elemDiff);CHKERRQ(ierr);}
360cb1e1211SMatthew G Knepley     localDiff += elemDiff;
361cb1e1211SMatthew G Knepley   }
36272f94c41SMatthew G. Knepley   ierr  = PetscFree5(funcVal,coords,v0,J,invJ);CHKERRQ(ierr);
363cb1e1211SMatthew G Knepley   ierr  = DMRestoreLocalVector(dm, &localX);CHKERRQ(ierr);
36486a74ee0SMatthew G. Knepley   ierr  = MPI_Allreduce(&localDiff, diff, 1, MPIU_REAL, MPI_SUM, PetscObjectComm((PetscObject)dm));CHKERRQ(ierr);
365cb1e1211SMatthew G Knepley   *diff = PetscSqrtReal(*diff);
366cb1e1211SMatthew G Knepley   PetscFunctionReturn(0);
367cb1e1211SMatthew G Knepley }
368cb1e1211SMatthew G Knepley 
369cb1e1211SMatthew G Knepley #undef __FUNCT__
370*40e14135SMatthew G. Knepley #define __FUNCT__ "DMPlexComputeL2GradientDiff"
371*40e14135SMatthew G. Knepley /*@C
372*40e14135SMatthew G. Knepley   DMPlexComputeL2GradientDiff - This function computes the L_2 difference between the gradient of a function u and an FEM interpolant solution grad u_h.
373*40e14135SMatthew G. Knepley 
374*40e14135SMatthew G. Knepley   Input Parameters:
375*40e14135SMatthew G. Knepley + dm    - The DM
376*40e14135SMatthew G. Knepley . fe    - The PetscFE object for each field
377*40e14135SMatthew G. Knepley . funcs - The gradient functions to evaluate for each field component
378*40e14135SMatthew G. Knepley . X     - The coefficient vector u_h
379*40e14135SMatthew G. Knepley - n     - The vector to project along
380*40e14135SMatthew G. Knepley 
381*40e14135SMatthew G. Knepley   Output Parameter:
382*40e14135SMatthew G. Knepley . diff - The diff ||(grad u - grad u_h) . n||_2
383*40e14135SMatthew G. Knepley 
384*40e14135SMatthew G. Knepley   Level: developer
385*40e14135SMatthew G. Knepley 
386*40e14135SMatthew G. Knepley .seealso: DMPlexProjectFunction(), DMPlexComputeL2Diff()
387*40e14135SMatthew G. Knepley @*/
388*40e14135SMatthew G. Knepley PetscErrorCode DMPlexComputeL2GradientDiff(DM dm, PetscFE fe[], void (**funcs)(const PetscReal [], const PetscReal [], PetscScalar *), Vec X, const PetscReal n[], PetscReal *diff)
389cb1e1211SMatthew G Knepley {
390*40e14135SMatthew G. Knepley   const PetscInt  debug = 0;
391cb1e1211SMatthew G Knepley   PetscSection    section;
392*40e14135SMatthew G. Knepley   PetscQuadrature quad;
393*40e14135SMatthew G. Knepley   Vec             localX;
394*40e14135SMatthew G. Knepley   PetscScalar    *funcVal, *interpolantVec;
395*40e14135SMatthew G. Knepley   PetscReal      *coords, *realSpaceDer, *v0, *J, *invJ, detJ;
396*40e14135SMatthew G. Knepley   PetscReal       localDiff = 0.0;
397*40e14135SMatthew G. Knepley   PetscInt        dim, numFields, numComponents = 0, cStart, cEnd, c, field, fieldOffset, comp;
398cb1e1211SMatthew G Knepley   PetscErrorCode  ierr;
399cb1e1211SMatthew G Knepley 
400cb1e1211SMatthew G Knepley   PetscFunctionBegin;
401*40e14135SMatthew G. Knepley   ierr = DMPlexGetDimension(dm, &dim);CHKERRQ(ierr);
402*40e14135SMatthew G. Knepley   ierr = DMGetDefaultSection(dm, &section);CHKERRQ(ierr);
403*40e14135SMatthew G. Knepley   ierr = PetscSectionGetNumFields(section, &numFields);CHKERRQ(ierr);
404*40e14135SMatthew G. Knepley   ierr = DMGetLocalVector(dm, &localX);CHKERRQ(ierr);
405*40e14135SMatthew G. Knepley   ierr = DMGlobalToLocalBegin(dm, X, INSERT_VALUES, localX);CHKERRQ(ierr);
406*40e14135SMatthew G. Knepley   ierr = DMGlobalToLocalEnd(dm, X, INSERT_VALUES, localX);CHKERRQ(ierr);
407652b88e8SMatthew G. Knepley   for (field = 0; field < numFields; ++field) {
408*40e14135SMatthew G. Knepley     PetscInt Nc;
409652b88e8SMatthew G. Knepley 
410*40e14135SMatthew G. Knepley     ierr = PetscFEGetNumComponents(fe[field], &Nc);CHKERRQ(ierr);
411*40e14135SMatthew G. Knepley     numComponents += Nc;
412652b88e8SMatthew G. Knepley   }
413*40e14135SMatthew G. Knepley   /* ierr = DMPlexProjectFunctionLocal(dm, fe, funcs, INSERT_BC_VALUES, localX);CHKERRQ(ierr); */
414*40e14135SMatthew G. Knepley   ierr = PetscMalloc7(numComponents,&funcVal,dim,&coords,dim,&realSpaceDer,dim,&v0,dim*dim,&J,dim*dim,&invJ,dim,&interpolantVec);CHKERRQ(ierr);
415*40e14135SMatthew G. Knepley   ierr = DMPlexGetHeightStratum(dm, 0, &cStart, &cEnd);CHKERRQ(ierr);
416*40e14135SMatthew G. Knepley   ierr = PetscFEGetQuadrature(fe[0], &quad);CHKERRQ(ierr);
417*40e14135SMatthew G. Knepley   for (c = cStart; c < cEnd; ++c) {
418*40e14135SMatthew G. Knepley     PetscScalar *x = NULL;
419*40e14135SMatthew G. Knepley     PetscReal    elemDiff = 0.0;
420652b88e8SMatthew G. Knepley 
421*40e14135SMatthew G. Knepley     ierr = DMPlexComputeCellGeometry(dm, c, v0, J, invJ, &detJ);CHKERRQ(ierr);
422*40e14135SMatthew G. Knepley     if (detJ <= 0.0) SETERRQ2(PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Invalid determinant %g for element %d", detJ, c);
423*40e14135SMatthew G. Knepley     ierr = DMPlexVecGetClosure(dm, NULL, localX, c, NULL, &x);CHKERRQ(ierr);
424*40e14135SMatthew G. Knepley 
425*40e14135SMatthew G. Knepley     for (field = 0, comp = 0, fieldOffset = 0; field < numFields; ++field) {
426*40e14135SMatthew G. Knepley       const PetscInt   numQuadPoints = quad.numPoints;
427*40e14135SMatthew G. Knepley       const PetscReal *quadPoints    = quad.points;
428*40e14135SMatthew G. Knepley       const PetscReal *quadWeights   = quad.weights;
429*40e14135SMatthew G. Knepley       PetscReal       *basisDer;
430*40e14135SMatthew G. Knepley       PetscInt         Nb, Ncomp, q, d, e, fc, f, g;
431*40e14135SMatthew G. Knepley 
432*40e14135SMatthew G. Knepley       ierr = PetscFEGetDimension(fe[field], &Nb);CHKERRQ(ierr);
433*40e14135SMatthew G. Knepley       ierr = PetscFEGetNumComponents(fe[field], &Ncomp);CHKERRQ(ierr);
434*40e14135SMatthew G. Knepley       ierr = PetscFEGetDefaultTabulation(fe[field], NULL, &basisDer, NULL);CHKERRQ(ierr);
435*40e14135SMatthew G. Knepley       if (debug) {
436*40e14135SMatthew G. Knepley         char title[1024];
437*40e14135SMatthew G. Knepley         ierr = PetscSNPrintf(title, 1023, "Solution for Field %d", field);CHKERRQ(ierr);
438*40e14135SMatthew G. Knepley         ierr = DMPrintCellVector(c, title, Nb*Ncomp, &x[fieldOffset]);CHKERRQ(ierr);
439652b88e8SMatthew G. Knepley       }
440*40e14135SMatthew G. Knepley       for (q = 0; q < numQuadPoints; ++q) {
441*40e14135SMatthew G. Knepley         for (d = 0; d < dim; d++) {
442*40e14135SMatthew G. Knepley           coords[d] = v0[d];
443*40e14135SMatthew G. Knepley           for (e = 0; e < dim; e++) {
444*40e14135SMatthew G. Knepley             coords[d] += J[d*dim+e]*(quadPoints[q*dim+e] + 1.0);
445652b88e8SMatthew G. Knepley           }
446*40e14135SMatthew G. Knepley         }
447*40e14135SMatthew G. Knepley         (*funcs[field])(coords, n, funcVal);
448*40e14135SMatthew G. Knepley         for (fc = 0; fc < Ncomp; ++fc) {
449*40e14135SMatthew G. Knepley           PetscScalar interpolant = 0.0;
450*40e14135SMatthew G. Knepley 
451*40e14135SMatthew G. Knepley           for (d = 0; d < dim; ++d) interpolantVec[d] = 0.0;
452*40e14135SMatthew G. Knepley           for (f = 0; f < Nb; ++f) {
453*40e14135SMatthew G. Knepley             const PetscInt fidx = f*Ncomp+fc;
454*40e14135SMatthew G. Knepley 
455*40e14135SMatthew G. Knepley             for (d = 0; d < dim; ++d) {
456*40e14135SMatthew G. Knepley               realSpaceDer[d] = 0.0;
457*40e14135SMatthew G. Knepley               for (g = 0; g < dim; ++g) {
458*40e14135SMatthew G. Knepley                 realSpaceDer[d] += invJ[g*dim+d]*basisDer[(q*Nb*Ncomp+fidx)*dim+g];
459*40e14135SMatthew G. Knepley               }
460*40e14135SMatthew G. Knepley               interpolantVec[d] += x[fieldOffset+fidx]*realSpaceDer[d];
461*40e14135SMatthew G. Knepley             }
462*40e14135SMatthew G. Knepley           }
463*40e14135SMatthew G. Knepley           for (d = 0; d < dim; ++d) interpolant += interpolantVec[d]*n[d];
464*40e14135SMatthew G. Knepley           if (debug) {ierr = PetscPrintf(PETSC_COMM_SELF, "    elem %d fieldDer %d diff %g\n", c, field, PetscSqr(PetscRealPart(interpolant - funcVal[fc]))*quadWeights[q]*detJ);CHKERRQ(ierr);}
465*40e14135SMatthew G. Knepley           elemDiff += PetscSqr(PetscRealPart(interpolant - funcVal[fc]))*quadWeights[q]*detJ;
466*40e14135SMatthew G. Knepley         }
467*40e14135SMatthew G. Knepley       }
468*40e14135SMatthew G. Knepley       comp        += Ncomp;
469*40e14135SMatthew G. Knepley       fieldOffset += Nb*Ncomp;
470*40e14135SMatthew G. Knepley     }
471*40e14135SMatthew G. Knepley     ierr = DMPlexVecRestoreClosure(dm, NULL, localX, c, NULL, &x);CHKERRQ(ierr);
472*40e14135SMatthew G. Knepley     if (debug) {ierr = PetscPrintf(PETSC_COMM_SELF, "  elem %d diff %g\n", c, elemDiff);CHKERRQ(ierr);}
473*40e14135SMatthew G. Knepley     localDiff += elemDiff;
474*40e14135SMatthew G. Knepley   }
475*40e14135SMatthew G. Knepley     ierr  = PetscFree7(funcVal,coords,realSpaceDer,v0,J,invJ,interpolantVec);CHKERRQ(ierr);
476*40e14135SMatthew G. Knepley   ierr  = DMRestoreLocalVector(dm, &localX);CHKERRQ(ierr);
477*40e14135SMatthew G. Knepley   ierr  = MPI_Allreduce(&localDiff, diff, 1, MPIU_REAL, MPI_SUM, PetscObjectComm((PetscObject)dm));CHKERRQ(ierr);
478*40e14135SMatthew G. Knepley   *diff = PetscSqrtReal(*diff);
479cb1e1211SMatthew G Knepley   PetscFunctionReturn(0);
480cb1e1211SMatthew G Knepley }
481cb1e1211SMatthew G Knepley 
482a0845e3aSMatthew G. Knepley #undef __FUNCT__
483a0845e3aSMatthew G. Knepley #define __FUNCT__ "DMPlexComputeResidualFEM"
484a0845e3aSMatthew G. Knepley /*@
485a0845e3aSMatthew G. Knepley   DMPlexComputeResidualFEM - Form the local residual F from the local input X using pointwise functions specified by the user
486a0845e3aSMatthew G. Knepley 
487a0845e3aSMatthew G. Knepley   Input Parameters:
488a0845e3aSMatthew G. Knepley + dm - The mesh
489a0845e3aSMatthew G. Knepley . X  - Local input vector
490a0845e3aSMatthew G. Knepley - user - The user context
491a0845e3aSMatthew G. Knepley 
492a0845e3aSMatthew G. Knepley   Output Parameter:
493a0845e3aSMatthew G. Knepley . F  - Local output vector
494a0845e3aSMatthew G. Knepley 
495a0845e3aSMatthew G. Knepley   Note:
496a0845e3aSMatthew G. Knepley   The second member of the user context must be an FEMContext.
497a0845e3aSMatthew G. Knepley 
498a0845e3aSMatthew G. Knepley   We form the residual one batch of elements at a time. This allows us to offload work onto an accelerator,
499a0845e3aSMatthew G. Knepley   like a GPU, or vectorize on a multicore machine.
500a0845e3aSMatthew G. Knepley 
501a0845e3aSMatthew G. Knepley   Level: developer
502a0845e3aSMatthew G. Knepley 
503a0845e3aSMatthew G. Knepley .seealso: DMPlexComputeJacobianActionFEM()
504a0845e3aSMatthew G. Knepley @*/
505a0845e3aSMatthew G. Knepley PetscErrorCode DMPlexComputeResidualFEM(DM dm, Vec X, Vec F, void *user)
506a0845e3aSMatthew G. Knepley {
507a0845e3aSMatthew G. Knepley   DM_Plex          *mesh  = (DM_Plex *) dm->data;
5089a559087SMatthew G. Knepley   PetscFEM         *fem   = (PetscFEM *) user;
509a0845e3aSMatthew G. Knepley   PetscFE          *fe    = fem->fe;
5109a559087SMatthew G. Knepley   PetscFE          *feAux = fem->feAux;
511f1ea0e2fSMatthew G. Knepley   PetscFE          *feBd  = fem->feBd;
512a0845e3aSMatthew G. Knepley   const char       *name  = "Residual";
5139a559087SMatthew G. Knepley   DM                dmAux;
5149a559087SMatthew G. Knepley   Vec               A;
515a0845e3aSMatthew G. Knepley   PetscQuadrature   q;
516a0845e3aSMatthew G. Knepley   PetscCellGeometry geom;
5179a559087SMatthew G. Knepley   PetscSection      section, sectionAux;
518a0845e3aSMatthew G. Knepley   PetscReal        *v0, *J, *invJ, *detJ;
5199a559087SMatthew G. Knepley   PetscScalar      *elemVec, *u, *a;
5209a559087SMatthew G. Knepley   PetscInt          dim, Nf, NfAux = 0, f, numCells, cStart, cEnd, c;
521a0845e3aSMatthew G. Knepley   PetscInt          cellDof = 0, numComponents = 0;
5229a559087SMatthew G. Knepley   PetscInt          cellDofAux = 0, numComponentsAux = 0;
523a0845e3aSMatthew G. Knepley   PetscErrorCode    ierr;
524a0845e3aSMatthew G. Knepley 
525a0845e3aSMatthew G. Knepley   PetscFunctionBegin;
526a0845e3aSMatthew G. Knepley   ierr = PetscLogEventBegin(DMPLEX_ResidualFEM,dm,0,0,0);CHKERRQ(ierr);
527a0845e3aSMatthew G. Knepley   ierr = DMPlexGetDimension(dm, &dim);CHKERRQ(ierr);
528a0845e3aSMatthew G. Knepley   ierr = DMGetDefaultSection(dm, &section);CHKERRQ(ierr);
5299a559087SMatthew G. Knepley   ierr = PetscSectionGetNumFields(section, &Nf);CHKERRQ(ierr);
530a0845e3aSMatthew G. Knepley   ierr = DMPlexGetHeightStratum(dm, 0, &cStart, &cEnd);CHKERRQ(ierr);
531a0845e3aSMatthew G. Knepley   numCells = cEnd - cStart;
5329a559087SMatthew G. Knepley   for (f = 0; f < Nf; ++f) {
533a0845e3aSMatthew G. Knepley     PetscInt Nb, Nc;
534a0845e3aSMatthew G. Knepley 
535a0845e3aSMatthew G. Knepley     ierr = PetscFEGetDimension(fe[f], &Nb);CHKERRQ(ierr);
536a0845e3aSMatthew G. Knepley     ierr = PetscFEGetNumComponents(fe[f], &Nc);CHKERRQ(ierr);
537a0845e3aSMatthew G. Knepley     cellDof       += Nb*Nc;
538a0845e3aSMatthew G. Knepley     numComponents += Nc;
539a0845e3aSMatthew G. Knepley   }
5409a559087SMatthew G. Knepley   ierr = PetscObjectQuery((PetscObject) dm, "dmAux", (PetscObject *) &dmAux);CHKERRQ(ierr);
5419a559087SMatthew G. Knepley   ierr = PetscObjectQuery((PetscObject) dm, "A", (PetscObject *) &A);CHKERRQ(ierr);
5429a559087SMatthew G. Knepley   if (dmAux) {
5439a559087SMatthew G. Knepley     ierr = DMGetDefaultSection(dmAux, &sectionAux);CHKERRQ(ierr);
5449a559087SMatthew G. Knepley     ierr = PetscSectionGetNumFields(sectionAux, &NfAux);CHKERRQ(ierr);
5459a559087SMatthew G. Knepley   }
5469a559087SMatthew G. Knepley   for (f = 0; f < NfAux; ++f) {
5479a559087SMatthew G. Knepley     PetscInt Nb, Nc;
5489a559087SMatthew G. Knepley 
5499a559087SMatthew G. Knepley     ierr = PetscFEGetDimension(feAux[f], &Nb);CHKERRQ(ierr);
5509a559087SMatthew G. Knepley     ierr = PetscFEGetNumComponents(feAux[f], &Nc);CHKERRQ(ierr);
5519a559087SMatthew G. Knepley     cellDofAux       += Nb*Nc;
5529a559087SMatthew G. Knepley     numComponentsAux += Nc;
5539a559087SMatthew G. Knepley   }
55472f94c41SMatthew G. Knepley   ierr = DMPlexProjectFunctionLocal(dm, fe, fem->bcFuncs, INSERT_BC_VALUES, X);CHKERRQ(ierr);
555a0845e3aSMatthew G. Knepley   ierr = VecSet(F, 0.0);CHKERRQ(ierr);
556dcca6d9dSJed Brown   ierr = PetscMalloc6(numCells*cellDof,&u,numCells*dim,&v0,numCells*dim*dim,&J,numCells*dim*dim,&invJ,numCells,&detJ,numCells*cellDof,&elemVec);CHKERRQ(ierr);
557785e854fSJed Brown   if (dmAux) {ierr = PetscMalloc1(numCells*cellDofAux, &a);CHKERRQ(ierr);}
558a0845e3aSMatthew G. Knepley   for (c = cStart; c < cEnd; ++c) {
559a0845e3aSMatthew G. Knepley     PetscScalar *x = NULL;
560a0845e3aSMatthew G. Knepley     PetscInt     i;
561a0845e3aSMatthew G. Knepley 
562a0845e3aSMatthew G. Knepley     ierr = DMPlexComputeCellGeometry(dm, c, &v0[c*dim], &J[c*dim*dim], &invJ[c*dim*dim], &detJ[c]);CHKERRQ(ierr);
563a0845e3aSMatthew G. Knepley     if (detJ[c] <= 0.0) SETERRQ2(PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Invalid determinant %g for element %d", detJ[c], c);
564a0845e3aSMatthew G. Knepley     ierr = DMPlexVecGetClosure(dm, section, X, c, NULL, &x);CHKERRQ(ierr);
565a0845e3aSMatthew G. Knepley     for (i = 0; i < cellDof; ++i) u[c*cellDof+i] = x[i];
566a0845e3aSMatthew G. Knepley     ierr = DMPlexVecRestoreClosure(dm, section, X, c, NULL, &x);CHKERRQ(ierr);
5679a559087SMatthew G. Knepley     if (dmAux) {
5689a559087SMatthew G. Knepley       ierr = DMPlexVecGetClosure(dmAux, sectionAux, A, c, NULL, &x);CHKERRQ(ierr);
5699a559087SMatthew G. Knepley       for (i = 0; i < cellDofAux; ++i) a[c*cellDofAux+i] = x[i];
5709a559087SMatthew G. Knepley       ierr = DMPlexVecRestoreClosure(dmAux, sectionAux, A, c, NULL, &x);CHKERRQ(ierr);
571a0845e3aSMatthew G. Knepley     }
5729a559087SMatthew G. Knepley   }
5739a559087SMatthew G. Knepley   for (f = 0; f < Nf; ++f) {
574c012ea0aSMatthew G. Knepley     void   (*f0)(const PetscScalar[], const PetscScalar[], const PetscScalar[], const PetscScalar[], const PetscReal[], PetscScalar[]) = fem->f0Funcs[f];
575c012ea0aSMatthew G. Knepley     void   (*f1)(const PetscScalar[], const PetscScalar[], const PetscScalar[], const PetscScalar[], const PetscReal[], PetscScalar[]) = fem->f1Funcs[f];
576a0845e3aSMatthew G. Knepley     PetscInt Nb;
577a0845e3aSMatthew G. Knepley     /* Conforming batches */
578f30c5766SMatthew G. Knepley     PetscInt numChunks, numBatches, numBlocks, Ne, blockSize, batchSize;
579a0845e3aSMatthew G. Knepley     /* Remainder */
580a0845e3aSMatthew G. Knepley     PetscInt Nr, offset;
581a0845e3aSMatthew G. Knepley 
582a0845e3aSMatthew G. Knepley     ierr = PetscFEGetQuadrature(fe[f], &q);CHKERRQ(ierr);
583a0845e3aSMatthew G. Knepley     ierr = PetscFEGetDimension(fe[f], &Nb);CHKERRQ(ierr);
584f30c5766SMatthew G. Knepley     ierr = PetscFEGetTileSizes(fe[f], NULL, &numBlocks, NULL, &numBatches);CHKERRQ(ierr);
585f9fd7fdbSMatthew G. Knepley     blockSize = Nb*q.numPoints;
586a0845e3aSMatthew G. Knepley     batchSize = numBlocks * blockSize;
587f30c5766SMatthew G. Knepley     ierr =  PetscFESetTileSizes(fe[f], blockSize, numBlocks, batchSize, numBatches);CHKERRQ(ierr);
588a0845e3aSMatthew G. Knepley     numChunks = numCells / (numBatches*batchSize);
589a0845e3aSMatthew G. Knepley     Ne        = numChunks*numBatches*batchSize;
590a0845e3aSMatthew G. Knepley     Nr        = numCells % (numBatches*batchSize);
591a0845e3aSMatthew G. Knepley     offset    = numCells - Nr;
592a0845e3aSMatthew G. Knepley     geom.v0   = v0;
593a0845e3aSMatthew G. Knepley     geom.J    = J;
594a0845e3aSMatthew G. Knepley     geom.invJ = invJ;
595a0845e3aSMatthew G. Knepley     geom.detJ = detJ;
5969a559087SMatthew G. Knepley     ierr = PetscFEIntegrateResidual(fe[f], Ne, Nf, fe, f, geom, u, NfAux, feAux, a, f0, f1, elemVec);CHKERRQ(ierr);
597a0845e3aSMatthew G. Knepley     geom.v0   = &v0[offset*dim];
598a0845e3aSMatthew G. Knepley     geom.J    = &J[offset*dim*dim];
599a0845e3aSMatthew G. Knepley     geom.invJ = &invJ[offset*dim*dim];
600a0845e3aSMatthew G. Knepley     geom.detJ = &detJ[offset];
6019a559087SMatthew G. Knepley     ierr = PetscFEIntegrateResidual(fe[f], Nr, Nf, fe, f, geom, &u[offset*cellDof], NfAux, feAux, &a[offset*cellDofAux], f0, f1, &elemVec[offset*cellDof]);CHKERRQ(ierr);
602a0845e3aSMatthew G. Knepley   }
603a0845e3aSMatthew G. Knepley   for (c = cStart; c < cEnd; ++c) {
604a0845e3aSMatthew G. Knepley     if (mesh->printFEM > 1) {ierr = DMPrintCellVector(c, name, cellDof, &elemVec[c*cellDof]);CHKERRQ(ierr);}
605a0845e3aSMatthew G. Knepley     ierr = DMPlexVecSetClosure(dm, section, F, c, &elemVec[c*cellDof], ADD_VALUES);CHKERRQ(ierr);
606a0845e3aSMatthew G. Knepley   }
607a0845e3aSMatthew G. Knepley   ierr = PetscFree6(u,v0,J,invJ,detJ,elemVec);CHKERRQ(ierr);
6089a559087SMatthew G. Knepley   if (dmAux) {ierr = PetscFree(a);CHKERRQ(ierr);}
609f1ea0e2fSMatthew G. Knepley   if (feBd) {
610075da914SMatthew G. Knepley     DMLabel         label, depth;
611f1ea0e2fSMatthew G. Knepley     IS              pointIS;
612f1ea0e2fSMatthew G. Knepley     const PetscInt *points;
613075da914SMatthew G. Knepley     PetscInt        dep, numPoints, p, numFaces;
614f1ea0e2fSMatthew G. Knepley     PetscReal      *n;
615f1ea0e2fSMatthew G. Knepley 
616f1ea0e2fSMatthew G. Knepley     ierr = DMPlexGetLabel(dm, "boundary", &label);CHKERRQ(ierr);
617075da914SMatthew G. Knepley     ierr = DMPlexGetDepthLabel(dm, &depth);CHKERRQ(ierr);
618f1ea0e2fSMatthew G. Knepley     ierr = DMLabelGetStratumSize(label, 1, &numPoints);CHKERRQ(ierr);
619f1ea0e2fSMatthew G. Knepley     ierr = DMLabelGetStratumIS(label, 1, &pointIS);CHKERRQ(ierr);
620f1ea0e2fSMatthew G. Knepley     ierr = ISGetIndices(pointIS, &points);CHKERRQ(ierr);
621f1ea0e2fSMatthew G. Knepley     for (f = 0, cellDof = 0, numComponents = 0; f < Nf; ++f) {
622f1ea0e2fSMatthew G. Knepley       PetscInt Nb, Nc;
623f1ea0e2fSMatthew G. Knepley 
624f1ea0e2fSMatthew G. Knepley       ierr = PetscFEGetDimension(feBd[f], &Nb);CHKERRQ(ierr);
625f1ea0e2fSMatthew G. Knepley       ierr = PetscFEGetNumComponents(feBd[f], &Nc);CHKERRQ(ierr);
626f1ea0e2fSMatthew G. Knepley       cellDof       += Nb*Nc;
627f1ea0e2fSMatthew G. Knepley       numComponents += Nc;
628f1ea0e2fSMatthew G. Knepley     }
629075da914SMatthew G. Knepley     for (p = 0, numFaces = 0; p < numPoints; ++p) {
630075da914SMatthew G. Knepley       ierr = DMLabelGetValue(depth, points[p], &dep);CHKERRQ(ierr);
631075da914SMatthew G. Knepley       if (dep == dim-1) ++numFaces;
632075da914SMatthew G. Knepley     }
633dcca6d9dSJed Brown     ierr = PetscMalloc7(numFaces*cellDof,&u,numFaces*dim,&v0,numFaces*dim,&n,numFaces*dim*dim,&J,numFaces*dim*dim,&invJ,numFaces,&detJ,numFaces*cellDof,&elemVec);CHKERRQ(ierr);
634075da914SMatthew G. Knepley     for (p = 0, f = 0; p < numPoints; ++p) {
635f1ea0e2fSMatthew G. Knepley       const PetscInt point = points[p];
636f1ea0e2fSMatthew G. Knepley       PetscScalar   *x     = NULL;
637f1ea0e2fSMatthew G. Knepley       PetscInt       i;
638f1ea0e2fSMatthew G. Knepley 
639075da914SMatthew G. Knepley       ierr = DMLabelGetValue(depth, points[p], &dep);CHKERRQ(ierr);
640075da914SMatthew G. Knepley       if (dep != dim-1) continue;
641075da914SMatthew G. Knepley       ierr = DMPlexComputeCellGeometry(dm, point, &v0[f*dim], &J[f*dim*dim], &invJ[f*dim*dim], &detJ[f]);CHKERRQ(ierr);
642a8007bbfSMatthew G. Knepley       ierr = DMPlexComputeCellGeometryFVM(dm, point, NULL, NULL, &n[f*dim]);
643075da914SMatthew G. Knepley       if (detJ[f] <= 0.0) SETERRQ2(PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Invalid determinant %g for face %d", detJ[f], point);
644f1ea0e2fSMatthew G. Knepley       ierr = DMPlexVecGetClosure(dm, section, X, point, NULL, &x);CHKERRQ(ierr);
645075da914SMatthew G. Knepley       for (i = 0; i < cellDof; ++i) u[f*cellDof+i] = x[i];
646f1ea0e2fSMatthew G. Knepley       ierr = DMPlexVecRestoreClosure(dm, section, X, point, NULL, &x);CHKERRQ(ierr);
647075da914SMatthew G. Knepley       ++f;
648f1ea0e2fSMatthew G. Knepley     }
649f1ea0e2fSMatthew G. Knepley     for (f = 0; f < Nf; ++f) {
650f1ea0e2fSMatthew G. Knepley       void   (*f0)(const PetscScalar[], const PetscScalar[], const PetscScalar[], const PetscScalar[], const PetscReal[], const PetscReal[], PetscScalar[]) = fem->f0BdFuncs[f];
651f1ea0e2fSMatthew G. Knepley       void   (*f1)(const PetscScalar[], const PetscScalar[], const PetscScalar[], const PetscScalar[], const PetscReal[], const PetscReal[], PetscScalar[]) = fem->f1BdFuncs[f];
652f1ea0e2fSMatthew G. Knepley       PetscInt Nb;
653f1ea0e2fSMatthew G. Knepley       /* Conforming batches */
654f1ea0e2fSMatthew G. Knepley       PetscInt numChunks, numBatches, numBlocks, Ne, blockSize, batchSize;
655f1ea0e2fSMatthew G. Knepley       /* Remainder */
656f1ea0e2fSMatthew G. Knepley       PetscInt Nr, offset;
657f1ea0e2fSMatthew G. Knepley 
658f1ea0e2fSMatthew G. Knepley       ierr = PetscFEGetQuadrature(feBd[f], &q);CHKERRQ(ierr);
659f1ea0e2fSMatthew G. Knepley       ierr = PetscFEGetDimension(feBd[f], &Nb);CHKERRQ(ierr);
660f1ea0e2fSMatthew G. Knepley       ierr = PetscFEGetTileSizes(feBd[f], NULL, &numBlocks, NULL, &numBatches);CHKERRQ(ierr);
661f9fd7fdbSMatthew G. Knepley       blockSize = Nb*q.numPoints;
662f1ea0e2fSMatthew G. Knepley       batchSize = numBlocks * blockSize;
663f1ea0e2fSMatthew G. Knepley       ierr =  PetscFESetTileSizes(feBd[f], blockSize, numBlocks, batchSize, numBatches);CHKERRQ(ierr);
664075da914SMatthew G. Knepley       numChunks = numFaces / (numBatches*batchSize);
665f1ea0e2fSMatthew G. Knepley       Ne        = numChunks*numBatches*batchSize;
666075da914SMatthew G. Knepley       Nr        = numFaces % (numBatches*batchSize);
667075da914SMatthew G. Knepley       offset    = numFaces - Nr;
668f1ea0e2fSMatthew G. Knepley       geom.v0   = v0;
669f1ea0e2fSMatthew G. Knepley       geom.n    = n;
670f1ea0e2fSMatthew G. Knepley       geom.J    = J;
671f1ea0e2fSMatthew G. Knepley       geom.invJ = invJ;
672f1ea0e2fSMatthew G. Knepley       geom.detJ = detJ;
673f1ea0e2fSMatthew G. Knepley       ierr = PetscFEIntegrateBdResidual(feBd[f], Ne, Nf, feBd, f, geom, u, 0, NULL, NULL, f0, f1, elemVec);CHKERRQ(ierr);
674f1ea0e2fSMatthew G. Knepley       geom.v0   = &v0[offset*dim];
675f1ea0e2fSMatthew G. Knepley       geom.n    = &n[offset*dim];
676f1ea0e2fSMatthew G. Knepley       geom.J    = &J[offset*dim*dim];
677f1ea0e2fSMatthew G. Knepley       geom.invJ = &invJ[offset*dim*dim];
678f1ea0e2fSMatthew G. Knepley       geom.detJ = &detJ[offset];
679f1ea0e2fSMatthew G. Knepley       ierr = PetscFEIntegrateBdResidual(feBd[f], Nr, Nf, feBd, f, geom, &u[offset*cellDof], 0, NULL, NULL, f0, f1, &elemVec[offset*cellDof]);CHKERRQ(ierr);
680f1ea0e2fSMatthew G. Knepley     }
681075da914SMatthew G. Knepley     for (p = 0, f = 0; p < numPoints; ++p) {
682f1ea0e2fSMatthew G. Knepley       const PetscInt point = points[p];
683f1ea0e2fSMatthew G. Knepley 
684075da914SMatthew G. Knepley       ierr = DMLabelGetValue(depth, point, &dep);CHKERRQ(ierr);
685075da914SMatthew G. Knepley       if (dep != dim-1) continue;
686075da914SMatthew G. Knepley       if (mesh->printFEM > 1) {ierr = DMPrintCellVector(point, "BdResidual", cellDof, &elemVec[f*cellDof]);CHKERRQ(ierr);}
687075da914SMatthew G. Knepley       ierr = DMPlexVecSetClosure(dm, NULL, F, point, &elemVec[f*cellDof], ADD_VALUES);CHKERRQ(ierr);
688075da914SMatthew G. Knepley       ++f;
689f1ea0e2fSMatthew G. Knepley     }
690f1ea0e2fSMatthew G. Knepley     ierr = ISRestoreIndices(pointIS, &points);CHKERRQ(ierr);
691f1ea0e2fSMatthew G. Knepley     ierr = ISDestroy(&pointIS);CHKERRQ(ierr);
692f1ea0e2fSMatthew G. Knepley     ierr = PetscFree7(u,v0,n,J,invJ,detJ,elemVec);CHKERRQ(ierr);
693f1ea0e2fSMatthew G. Knepley   }
6946113b454SMatthew G. Knepley   if (mesh->printFEM) {ierr = DMPrintLocalVec(dm, name, mesh->printTol, F);CHKERRQ(ierr);}
695a0845e3aSMatthew G. Knepley   ierr = PetscLogEventEnd(DMPLEX_ResidualFEM,dm,0,0,0);CHKERRQ(ierr);
696a0845e3aSMatthew G. Knepley   PetscFunctionReturn(0);
697a0845e3aSMatthew G. Knepley }
698a0845e3aSMatthew G. Knepley 
699cb1e1211SMatthew G Knepley #undef __FUNCT__
700cb1e1211SMatthew G Knepley #define __FUNCT__ "DMPlexComputeJacobianActionFEM"
701cb1e1211SMatthew G Knepley /*@C
702cb1e1211SMatthew G Knepley   DMPlexComputeJacobianActionFEM - Form the local action of Jacobian J(u) on the local input X using pointwise functions specified by the user
703cb1e1211SMatthew G Knepley 
704cb1e1211SMatthew G Knepley   Input Parameters:
705cb1e1211SMatthew G Knepley + dm - The mesh
706cb1e1211SMatthew G Knepley . J  - The Jacobian shell matrix
707cb1e1211SMatthew G Knepley . X  - Local input vector
708cb1e1211SMatthew G Knepley - user - The user context
709cb1e1211SMatthew G Knepley 
710cb1e1211SMatthew G Knepley   Output Parameter:
711cb1e1211SMatthew G Knepley . F  - Local output vector
712cb1e1211SMatthew G Knepley 
713cb1e1211SMatthew G Knepley   Note:
714cb1e1211SMatthew G Knepley   The second member of the user context must be an FEMContext.
715cb1e1211SMatthew G Knepley 
716cb1e1211SMatthew G Knepley   We form the residual one batch of elements at a time. This allows us to offload work onto an accelerator,
717cb1e1211SMatthew G Knepley   like a GPU, or vectorize on a multicore machine.
718cb1e1211SMatthew G Knepley 
7190059ad2aSSatish Balay   Level: developer
7200059ad2aSSatish Balay 
721cb1e1211SMatthew G Knepley .seealso: DMPlexComputeResidualFEM()
722878cb397SSatish Balay @*/
723cb1e1211SMatthew G Knepley PetscErrorCode DMPlexComputeJacobianActionFEM(DM dm, Mat Jac, Vec X, Vec F, void *user)
724cb1e1211SMatthew G Knepley {
725cb1e1211SMatthew G Knepley   DM_Plex          *mesh = (DM_Plex *) dm->data;
7269a559087SMatthew G. Knepley   PetscFEM         *fem  = (PetscFEM *) user;
7270483ade4SMatthew G. Knepley   PetscFE          *fe   = fem->fe;
7280483ade4SMatthew G. Knepley   PetscQuadrature   quad;
7290483ade4SMatthew G. Knepley   PetscCellGeometry geom;
730cb1e1211SMatthew G Knepley   PetscSection      section;
731cb1e1211SMatthew G Knepley   JacActionCtx     *jctx;
732cb1e1211SMatthew G Knepley   PetscReal        *v0, *J, *invJ, *detJ;
733cb1e1211SMatthew G Knepley   PetscScalar      *elemVec, *u, *a;
7340483ade4SMatthew G. Knepley   PetscInt          dim, numFields, field, numCells, cStart, cEnd, c;
735cb1e1211SMatthew G Knepley   PetscInt          cellDof = 0;
736cb1e1211SMatthew G Knepley   PetscErrorCode    ierr;
737cb1e1211SMatthew G Knepley 
738cb1e1211SMatthew G Knepley   PetscFunctionBegin;
7390483ade4SMatthew G. Knepley   /* ierr = PetscLogEventBegin(DMPLEX_JacobianActionFEM,dm,0,0,0);CHKERRQ(ierr); */
740cb1e1211SMatthew G Knepley   ierr = MatShellGetContext(Jac, &jctx);CHKERRQ(ierr);
741cb1e1211SMatthew G Knepley   ierr = DMPlexGetDimension(dm, &dim);CHKERRQ(ierr);
742cb1e1211SMatthew G Knepley   ierr = DMGetDefaultSection(dm, &section);CHKERRQ(ierr);
743cb1e1211SMatthew G Knepley   ierr = PetscSectionGetNumFields(section, &numFields);CHKERRQ(ierr);
744cb1e1211SMatthew G Knepley   ierr = DMPlexGetHeightStratum(dm, 0, &cStart, &cEnd);CHKERRQ(ierr);
745cb1e1211SMatthew G Knepley   numCells = cEnd - cStart;
746cb1e1211SMatthew G Knepley   for (field = 0; field < numFields; ++field) {
7470483ade4SMatthew G. Knepley     PetscInt Nb, Nc;
7480483ade4SMatthew G. Knepley 
7490483ade4SMatthew G. Knepley     ierr = PetscFEGetDimension(fe[field], &Nb);CHKERRQ(ierr);
7500483ade4SMatthew G. Knepley     ierr = PetscFEGetNumComponents(fe[field], &Nc);CHKERRQ(ierr);
7510483ade4SMatthew G. Knepley     cellDof += Nb*Nc;
752cb1e1211SMatthew G Knepley   }
753cb1e1211SMatthew G Knepley   ierr = VecSet(F, 0.0);CHKERRQ(ierr);
754dcca6d9dSJed Brown   ierr = PetscMalloc7(numCells*cellDof,&u,numCells*cellDof,&a,numCells*dim,&v0,numCells*dim*dim,&J,numCells*dim*dim,&invJ,numCells,&detJ,numCells*cellDof,&elemVec);CHKERRQ(ierr);
755cb1e1211SMatthew G Knepley   for (c = cStart; c < cEnd; ++c) {
756a1e44745SMatthew G. Knepley     PetscScalar *x = NULL;
757cb1e1211SMatthew G Knepley     PetscInt     i;
758cb1e1211SMatthew G Knepley 
759cb1e1211SMatthew G Knepley     ierr = DMPlexComputeCellGeometry(dm, c, &v0[c*dim], &J[c*dim*dim], &invJ[c*dim*dim], &detJ[c]);CHKERRQ(ierr);
760cb1e1211SMatthew G Knepley     if (detJ[c] <= 0.0) SETERRQ2(PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Invalid determinant %g for element %d", detJ[c], c);
761cb1e1211SMatthew G Knepley     ierr = DMPlexVecGetClosure(dm, NULL, jctx->u, c, NULL, &x);CHKERRQ(ierr);
762cb1e1211SMatthew G Knepley     for (i = 0; i < cellDof; ++i) u[c*cellDof+i] = x[i];
763cb1e1211SMatthew G Knepley     ierr = DMPlexVecRestoreClosure(dm, NULL, jctx->u, c, NULL, &x);CHKERRQ(ierr);
764cb1e1211SMatthew G Knepley     ierr = DMPlexVecGetClosure(dm, NULL, X, c, NULL, &x);CHKERRQ(ierr);
765cb1e1211SMatthew G Knepley     for (i = 0; i < cellDof; ++i) a[c*cellDof+i] = x[i];
766cb1e1211SMatthew G Knepley     ierr = DMPlexVecRestoreClosure(dm, NULL, X, c, NULL, &x);CHKERRQ(ierr);
767cb1e1211SMatthew G Knepley   }
768cb1e1211SMatthew G Knepley   for (field = 0; field < numFields; ++field) {
7690483ade4SMatthew G. Knepley     PetscInt Nb;
770cb1e1211SMatthew G Knepley     /* Conforming batches */
771cb1e1211SMatthew G Knepley     PetscInt numBlocks  = 1;
7720483ade4SMatthew G. Knepley     PetscInt numBatches = 1;
7730483ade4SMatthew G. Knepley     PetscInt numChunks, Ne, blockSize, batchSize;
774cb1e1211SMatthew G Knepley     /* Remainder */
7750483ade4SMatthew G. Knepley     PetscInt Nr, offset;
776cb1e1211SMatthew G Knepley 
7770483ade4SMatthew G. Knepley     ierr = PetscFEGetQuadrature(fe[field], &quad);CHKERRQ(ierr);
7780483ade4SMatthew G. Knepley     ierr = PetscFEGetDimension(fe[field], &Nb);CHKERRQ(ierr);
779f9fd7fdbSMatthew G. Knepley     blockSize = Nb*quad.numPoints;
7800483ade4SMatthew G. Knepley     batchSize = numBlocks * blockSize;
7810483ade4SMatthew G. Knepley     numChunks = numCells / (numBatches*batchSize);
7820483ade4SMatthew G. Knepley     Ne        = numChunks*numBatches*batchSize;
7830483ade4SMatthew G. Knepley     Nr        = numCells % (numBatches*batchSize);
7840483ade4SMatthew G. Knepley     offset    = numCells - Nr;
7850483ade4SMatthew G. Knepley     geom.v0   = v0;
7860483ade4SMatthew G. Knepley     geom.J    = J;
7870483ade4SMatthew G. Knepley     geom.invJ = invJ;
7880483ade4SMatthew G. Knepley     geom.detJ = detJ;
7890483ade4SMatthew G. Knepley     ierr = PetscFEIntegrateJacobianAction(fe[field], Ne, numFields, fe, field, geom, u, a, fem->g0Funcs, fem->g1Funcs, fem->g2Funcs, fem->g3Funcs, elemVec);CHKERRQ(ierr);
7900483ade4SMatthew G. Knepley     geom.v0   = &v0[offset*dim];
7910483ade4SMatthew G. Knepley     geom.J    = &J[offset*dim*dim];
7920483ade4SMatthew G. Knepley     geom.invJ = &invJ[offset*dim*dim];
7930483ade4SMatthew G. Knepley     geom.detJ = &detJ[offset];
7940483ade4SMatthew G. Knepley     ierr = PetscFEIntegrateJacobianAction(fe[field], Nr, numFields, fe, field, geom, &u[offset*cellDof], &a[offset*cellDof],
795cb1e1211SMatthew G Knepley                                           fem->g0Funcs, fem->g1Funcs, fem->g2Funcs, fem->g3Funcs, &elemVec[offset*cellDof]);CHKERRQ(ierr);
796cb1e1211SMatthew G Knepley   }
797cb1e1211SMatthew G Knepley   for (c = cStart; c < cEnd; ++c) {
798cb1e1211SMatthew G Knepley     if (mesh->printFEM > 1) {ierr = DMPrintCellVector(c, "Jacobian Action", cellDof, &elemVec[c*cellDof]);CHKERRQ(ierr);}
799cb1e1211SMatthew G Knepley     ierr = DMPlexVecSetClosure(dm, NULL, F, c, &elemVec[c*cellDof], ADD_VALUES);CHKERRQ(ierr);
800cb1e1211SMatthew G Knepley   }
801cb1e1211SMatthew G Knepley   ierr = PetscFree7(u,a,v0,J,invJ,detJ,elemVec);CHKERRQ(ierr);
802cb1e1211SMatthew G Knepley   if (mesh->printFEM) {
803cb1e1211SMatthew G Knepley     PetscMPIInt rank, numProcs;
804cb1e1211SMatthew G Knepley     PetscInt    p;
805cb1e1211SMatthew G Knepley 
806cb1e1211SMatthew G Knepley     ierr = MPI_Comm_rank(PetscObjectComm((PetscObject)dm), &rank);CHKERRQ(ierr);
807cb1e1211SMatthew G Knepley     ierr = MPI_Comm_size(PetscObjectComm((PetscObject)dm), &numProcs);CHKERRQ(ierr);
80886a74ee0SMatthew G. Knepley     ierr = PetscPrintf(PetscObjectComm((PetscObject)dm), "Jacobian Action:\n");CHKERRQ(ierr);
809cb1e1211SMatthew G Knepley     for (p = 0; p < numProcs; ++p) {
810cb1e1211SMatthew G Knepley       if (p == rank) {ierr = VecView(F, PETSC_VIEWER_STDOUT_SELF);CHKERRQ(ierr);}
811cb1e1211SMatthew G Knepley       ierr = PetscBarrier((PetscObject) dm);CHKERRQ(ierr);
812cb1e1211SMatthew G Knepley     }
813cb1e1211SMatthew G Knepley   }
8140483ade4SMatthew G. Knepley   /* ierr = PetscLogEventEnd(DMPLEX_JacobianActionFEM,dm,0,0,0);CHKERRQ(ierr); */
815cb1e1211SMatthew G Knepley   PetscFunctionReturn(0);
816cb1e1211SMatthew G Knepley }
817cb1e1211SMatthew G Knepley 
818cb1e1211SMatthew G Knepley #undef __FUNCT__
819cb1e1211SMatthew G Knepley #define __FUNCT__ "DMPlexComputeJacobianFEM"
820cb1e1211SMatthew G Knepley /*@
821cb1e1211SMatthew G Knepley   DMPlexComputeJacobianFEM - Form the local portion of the Jacobian matrix J at the local solution X using pointwise functions specified by the user.
822cb1e1211SMatthew G Knepley 
823cb1e1211SMatthew G Knepley   Input Parameters:
824cb1e1211SMatthew G Knepley + dm - The mesh
825cb1e1211SMatthew G Knepley . X  - Local input vector
826cb1e1211SMatthew G Knepley - user - The user context
827cb1e1211SMatthew G Knepley 
828cb1e1211SMatthew G Knepley   Output Parameter:
829cb1e1211SMatthew G Knepley . Jac  - Jacobian matrix
830cb1e1211SMatthew G Knepley 
831cb1e1211SMatthew G Knepley   Note:
832cb1e1211SMatthew G Knepley   The second member of the user context must be an FEMContext.
833cb1e1211SMatthew G Knepley 
834cb1e1211SMatthew G Knepley   We form the residual one batch of elements at a time. This allows us to offload work onto an accelerator,
835cb1e1211SMatthew G Knepley   like a GPU, or vectorize on a multicore machine.
836cb1e1211SMatthew G Knepley 
8370059ad2aSSatish Balay   Level: developer
8380059ad2aSSatish Balay 
839cb1e1211SMatthew G Knepley .seealso: FormFunctionLocal()
840878cb397SSatish Balay @*/
841cb1e1211SMatthew G Knepley PetscErrorCode DMPlexComputeJacobianFEM(DM dm, Vec X, Mat Jac, Mat JacP, MatStructure *str,void *user)
842cb1e1211SMatthew G Knepley {
843cb1e1211SMatthew G Knepley   DM_Plex          *mesh  = (DM_Plex *) dm->data;
8449a559087SMatthew G. Knepley   PetscFEM         *fem   = (PetscFEM *) user;
845a319912fSMatthew G. Knepley   PetscFE          *fe    = fem->fe;
846754551f4SMatthew G. Knepley   PetscFE          *feAux = fem->feAux;
847a319912fSMatthew G. Knepley   const char       *name  = "Jacobian";
848754551f4SMatthew G. Knepley   DM                dmAux;
849754551f4SMatthew G. Knepley   Vec               A;
850a319912fSMatthew G. Knepley   PetscQuadrature   quad;
851a319912fSMatthew G. Knepley   PetscCellGeometry geom;
852754551f4SMatthew G. Knepley   PetscSection      section, globalSection, sectionAux;
853cb1e1211SMatthew G Knepley   PetscReal        *v0, *J, *invJ, *detJ;
854754551f4SMatthew G. Knepley   PetscScalar      *elemMat, *u, *a;
855754551f4SMatthew G. Knepley   PetscInt          dim, Nf, NfAux = 0, f, fieldI, fieldJ, numCells, cStart, cEnd, c;
856cb1e1211SMatthew G Knepley   PetscInt          cellDof = 0, numComponents = 0;
857754551f4SMatthew G. Knepley   PetscInt          cellDofAux = 0, numComponentsAux = 0;
858cb1e1211SMatthew G Knepley   PetscBool         isShell;
859cb1e1211SMatthew G Knepley   PetscErrorCode    ierr;
860cb1e1211SMatthew G Knepley 
861cb1e1211SMatthew G Knepley   PetscFunctionBegin;
862a319912fSMatthew G. Knepley   ierr = PetscLogEventBegin(DMPLEX_JacobianFEM,dm,0,0,0);CHKERRQ(ierr);
863cb1e1211SMatthew G Knepley   ierr = DMPlexGetDimension(dm, &dim);CHKERRQ(ierr);
864cb1e1211SMatthew G Knepley   ierr = DMGetDefaultSection(dm, &section);CHKERRQ(ierr);
865a319912fSMatthew G. Knepley   ierr = DMGetDefaultGlobalSection(dm, &globalSection);CHKERRQ(ierr);
866754551f4SMatthew G. Knepley   ierr = PetscSectionGetNumFields(section, &Nf);CHKERRQ(ierr);
867cb1e1211SMatthew G Knepley   ierr = DMPlexGetHeightStratum(dm, 0, &cStart, &cEnd);CHKERRQ(ierr);
868cb1e1211SMatthew G Knepley   numCells = cEnd - cStart;
869754551f4SMatthew G. Knepley   for (f = 0; f < Nf; ++f) {
870a319912fSMatthew G. Knepley     PetscInt Nb, Nc;
871a319912fSMatthew G. Knepley 
872a319912fSMatthew G. Knepley     ierr = PetscFEGetDimension(fe[f], &Nb);CHKERRQ(ierr);
873a319912fSMatthew G. Knepley     ierr = PetscFEGetNumComponents(fe[f], &Nc);CHKERRQ(ierr);
874a319912fSMatthew G. Knepley     cellDof       += Nb*Nc;
875a319912fSMatthew G. Knepley     numComponents += Nc;
876cb1e1211SMatthew G Knepley   }
877754551f4SMatthew G. Knepley   ierr = PetscObjectQuery((PetscObject) dm, "dmAux", (PetscObject *) &dmAux);CHKERRQ(ierr);
878754551f4SMatthew G. Knepley   ierr = PetscObjectQuery((PetscObject) dm, "A", (PetscObject *) &A);CHKERRQ(ierr);
879754551f4SMatthew G. Knepley   if (dmAux) {
880754551f4SMatthew G. Knepley     ierr = DMGetDefaultSection(dmAux, &sectionAux);CHKERRQ(ierr);
881754551f4SMatthew G. Knepley     ierr = PetscSectionGetNumFields(sectionAux, &NfAux);CHKERRQ(ierr);
882754551f4SMatthew G. Knepley   }
883754551f4SMatthew G. Knepley   for (f = 0; f < NfAux; ++f) {
884754551f4SMatthew G. Knepley     PetscInt Nb, Nc;
885754551f4SMatthew G. Knepley 
886754551f4SMatthew G. Knepley     ierr = PetscFEGetDimension(feAux[f], &Nb);CHKERRQ(ierr);
887754551f4SMatthew G. Knepley     ierr = PetscFEGetNumComponents(feAux[f], &Nc);CHKERRQ(ierr);
888754551f4SMatthew G. Knepley     cellDofAux       += Nb*Nc;
889754551f4SMatthew G. Knepley     numComponentsAux += Nc;
890754551f4SMatthew G. Knepley   }
89172f94c41SMatthew G. Knepley   ierr = DMPlexProjectFunctionLocal(dm, fe, fem->bcFuncs, INSERT_BC_VALUES, X);CHKERRQ(ierr);
892cb1e1211SMatthew G Knepley   ierr = MatZeroEntries(JacP);CHKERRQ(ierr);
893dcca6d9dSJed Brown   ierr = PetscMalloc6(numCells*cellDof,&u,numCells*dim,&v0,numCells*dim*dim,&J,numCells*dim*dim,&invJ,numCells,&detJ,numCells*cellDof*cellDof,&elemMat);CHKERRQ(ierr);
894785e854fSJed Brown   if (dmAux) {ierr = PetscMalloc1(numCells*cellDofAux, &a);CHKERRQ(ierr);}
895cb1e1211SMatthew G Knepley   for (c = cStart; c < cEnd; ++c) {
896a1e44745SMatthew G. Knepley     PetscScalar *x = NULL;
897cb1e1211SMatthew G Knepley     PetscInt     i;
898cb1e1211SMatthew G Knepley 
899cb1e1211SMatthew G Knepley     ierr = DMPlexComputeCellGeometry(dm, c, &v0[c*dim], &J[c*dim*dim], &invJ[c*dim*dim], &detJ[c]);CHKERRQ(ierr);
900cb1e1211SMatthew G Knepley     if (detJ[c] <= 0.0) SETERRQ2(PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Invalid determinant %g for element %d", detJ[c], c);
901a319912fSMatthew G. Knepley     ierr = DMPlexVecGetClosure(dm, section, X, c, NULL, &x);CHKERRQ(ierr);
902cb1e1211SMatthew G Knepley     for (i = 0; i < cellDof; ++i) u[c*cellDof+i] = x[i];
903a319912fSMatthew G. Knepley     ierr = DMPlexVecRestoreClosure(dm, section, X, c, NULL, &x);CHKERRQ(ierr);
904754551f4SMatthew G. Knepley     if (dmAux) {
905754551f4SMatthew G. Knepley       ierr = DMPlexVecGetClosure(dmAux, sectionAux, A, c, NULL, &x);CHKERRQ(ierr);
906754551f4SMatthew G. Knepley       for (i = 0; i < cellDofAux; ++i) a[c*cellDofAux+i] = x[i];
907754551f4SMatthew G. Knepley       ierr = DMPlexVecRestoreClosure(dmAux, sectionAux, A, c, NULL, &x);CHKERRQ(ierr);
908754551f4SMatthew G. Knepley     }
909cb1e1211SMatthew G Knepley   }
910cb1e1211SMatthew G Knepley   ierr = PetscMemzero(elemMat, numCells*cellDof*cellDof * sizeof(PetscScalar));CHKERRQ(ierr);
911754551f4SMatthew G. Knepley   for (fieldI = 0; fieldI < Nf; ++fieldI) {
912a319912fSMatthew G. Knepley     PetscInt Nb;
913cb1e1211SMatthew G Knepley     /* Conforming batches */
914754551f4SMatthew G. Knepley     PetscInt numChunks, numBatches, numBlocks, Ne, blockSize, batchSize;
915cb1e1211SMatthew G Knepley     /* Remainder */
916a319912fSMatthew G. Knepley     PetscInt Nr, offset;
917cb1e1211SMatthew G Knepley 
918754551f4SMatthew G. Knepley     ierr = PetscFEGetQuadrature(fe[fieldI], &quad);CHKERRQ(ierr);
919754551f4SMatthew G. Knepley     ierr = PetscFEGetDimension(fe[fieldI], &Nb);CHKERRQ(ierr);
920754551f4SMatthew G. Knepley     ierr = PetscFEGetTileSizes(fe[fieldI], NULL, &numBlocks, NULL, &numBatches);CHKERRQ(ierr);
921f9fd7fdbSMatthew G. Knepley     blockSize = Nb*quad.numPoints;
922a319912fSMatthew G. Knepley     batchSize = numBlocks * blockSize;
923754551f4SMatthew G. Knepley     ierr = PetscFESetTileSizes(fe[fieldI], blockSize, numBlocks, batchSize, numBatches);CHKERRQ(ierr);
924a319912fSMatthew G. Knepley     numChunks = numCells / (numBatches*batchSize);
925a319912fSMatthew G. Knepley     Ne        = numChunks*numBatches*batchSize;
926a319912fSMatthew G. Knepley     Nr        = numCells % (numBatches*batchSize);
927a319912fSMatthew G. Knepley     offset    = numCells - Nr;
928754551f4SMatthew G. Knepley     for (fieldJ = 0; fieldJ < Nf; ++fieldJ) {
929754551f4SMatthew G. Knepley       void   (*g0)(const PetscScalar[], const PetscScalar[], const PetscScalar[], const PetscScalar[], const PetscReal[], PetscScalar[]) = fem->g0Funcs[fieldI*Nf+fieldJ];
930754551f4SMatthew G. Knepley       void   (*g1)(const PetscScalar[], const PetscScalar[], const PetscScalar[], const PetscScalar[], const PetscReal[], PetscScalar[]) = fem->g1Funcs[fieldI*Nf+fieldJ];
931754551f4SMatthew G. Knepley       void   (*g2)(const PetscScalar[], const PetscScalar[], const PetscScalar[], const PetscScalar[], const PetscReal[], PetscScalar[]) = fem->g2Funcs[fieldI*Nf+fieldJ];
932754551f4SMatthew G. Knepley       void   (*g3)(const PetscScalar[], const PetscScalar[], const PetscScalar[], const PetscScalar[], const PetscReal[], PetscScalar[]) = fem->g3Funcs[fieldI*Nf+fieldJ];
933754551f4SMatthew G. Knepley 
934a319912fSMatthew G. Knepley       geom.v0   = v0;
935a319912fSMatthew G. Knepley       geom.J    = J;
936a319912fSMatthew G. Knepley       geom.invJ = invJ;
937a319912fSMatthew G. Knepley       geom.detJ = detJ;
938754551f4SMatthew G. Knepley       ierr = PetscFEIntegrateJacobian(fe[fieldI], Ne, Nf, fe, fieldI, fieldJ, geom, u, NfAux, feAux, a, g0, g1, g2, g3, elemMat);CHKERRQ(ierr);
939a319912fSMatthew G. Knepley       geom.v0   = &v0[offset*dim];
940a319912fSMatthew G. Knepley       geom.J    = &J[offset*dim*dim];
941a319912fSMatthew G. Knepley       geom.invJ = &invJ[offset*dim*dim];
942a319912fSMatthew G. Knepley       geom.detJ = &detJ[offset];
943754551f4SMatthew G. Knepley       ierr = PetscFEIntegrateJacobian(fe[fieldI], Nr, Nf, fe, fieldI, fieldJ, geom, &u[offset*cellDof], NfAux, feAux, &a[offset*cellDofAux], g0, g1, g2, g3, &elemMat[offset*cellDof*cellDof]);CHKERRQ(ierr);
944cb1e1211SMatthew G Knepley     }
945cb1e1211SMatthew G Knepley   }
946cb1e1211SMatthew G Knepley   for (c = cStart; c < cEnd; ++c) {
947a319912fSMatthew G. Knepley     if (mesh->printFEM > 1) {ierr = DMPrintCellMatrix(c, name, cellDof, cellDof, &elemMat[c*cellDof*cellDof]);CHKERRQ(ierr);}
948a319912fSMatthew G. Knepley     ierr = DMPlexMatSetClosure(dm, section, globalSection, JacP, c, &elemMat[c*cellDof*cellDof], ADD_VALUES);CHKERRQ(ierr);
949cb1e1211SMatthew G Knepley   }
950cb1e1211SMatthew G Knepley   ierr = PetscFree6(u,v0,J,invJ,detJ,elemMat);CHKERRQ(ierr);
951754551f4SMatthew G. Knepley   if (dmAux) {ierr = PetscFree(a);CHKERRQ(ierr);}
952cb1e1211SMatthew G Knepley   ierr = MatAssemblyBegin(JacP, MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
953cb1e1211SMatthew G Knepley   ierr = MatAssemblyEnd(JacP, MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
954cb1e1211SMatthew G Knepley   if (mesh->printFEM) {
955a319912fSMatthew G. Knepley     ierr = PetscPrintf(PETSC_COMM_WORLD, "%s:\n", name);CHKERRQ(ierr);
956cb1e1211SMatthew G Knepley     ierr = MatChop(JacP, 1.0e-10);CHKERRQ(ierr);
957cb1e1211SMatthew G Knepley     ierr = MatView(JacP, PETSC_VIEWER_STDOUT_WORLD);CHKERRQ(ierr);
958cb1e1211SMatthew G Knepley   }
959a319912fSMatthew G. Knepley   ierr = PetscLogEventEnd(DMPLEX_JacobianFEM,dm,0,0,0);CHKERRQ(ierr);
960cb1e1211SMatthew G Knepley   ierr = PetscObjectTypeCompare((PetscObject) Jac, MATSHELL, &isShell);CHKERRQ(ierr);
961cb1e1211SMatthew G Knepley   if (isShell) {
962cb1e1211SMatthew G Knepley     JacActionCtx *jctx;
963cb1e1211SMatthew G Knepley 
964cb1e1211SMatthew G Knepley     ierr = MatShellGetContext(Jac, &jctx);CHKERRQ(ierr);
965cb1e1211SMatthew G Knepley     ierr = VecCopy(X, jctx->u);CHKERRQ(ierr);
966cb1e1211SMatthew G Knepley   }
967cb1e1211SMatthew G Knepley   *str = SAME_NONZERO_PATTERN;
968cb1e1211SMatthew G Knepley   PetscFunctionReturn(0);
969cb1e1211SMatthew G Knepley }
970