xref: /libCEED/examples/mfem/bp3.hpp (revision 182fbe45946cf03cf477817c69381239c28d901b)
// Copyright (c) 2017, Lawrence Livermore National Security, LLC. Produced at
// the Lawrence Livermore National Laboratory. LLNL-CODE-734707. All Rights
// reserved. See files LICENSE and NOTICE for details.
//
// This file is part of CEED, a collection of benchmarks, miniapps, software
// libraries and APIs for efficient high-order finite element and spectral
// element discretizations for exascale applications. For more information and
// source code availability see http://github.com/ceed.
//
// The CEED research is supported by the Exascale Computing Project 17-SC-20-SC,
// a collaborative effort of two U.S. Department of Energy organizations (Office
// of Science and the National Nuclear Security Administration) responsible for
// the planning and preparation of a capable exascale ecosystem, including
// software, applications, hardware, advanced system engineering and early
// testbed platforms, in support of the nation's exascale computing imperative.
16*182fbe45STzanio 
/// @file
/// MFEM diffusion operator based on libCEED
19*182fbe45STzanio 
20*182fbe45STzanio #include <ceed.h>
21*182fbe45STzanio #include <mfem.hpp>
22*182fbe45STzanio 
23*182fbe45STzanio /// A structure used to pass additional data to f_build_diff and f_apply_diff
24*182fbe45STzanio struct DiffContext { CeedInt dim, space_dim; };
25*182fbe45STzanio 
26*182fbe45STzanio /// libCEED Q-function for building quadrature data for a diffusion operator
27*182fbe45STzanio static int f_build_diff(void *ctx, void *qdata, CeedInt Q,
28*182fbe45STzanio                         const CeedScalar *const *u, CeedScalar *const *v) {
29*182fbe45STzanio   // u[1] is Jacobians, size (Q x nc x dim) with column-major layout
30*182fbe45STzanio   // u[4] is quadrature weights, size (Q)
31*182fbe45STzanio   //
32*182fbe45STzanio   // At every quadrature point, compute qw/det(J).adj(J).adj(J)^T and store
33*182fbe45STzanio   // the symmetric part of the result.
34*182fbe45STzanio   DiffContext *dc = (DiffContext*)ctx;
35*182fbe45STzanio   CeedScalar *qd = (CeedScalar*)qdata;
36*182fbe45STzanio   const CeedScalar *J = u[1], *qw = u[4];
37*182fbe45STzanio   switch (dc->dim + 10*dc->space_dim) {
38*182fbe45STzanio   case 11:
39*182fbe45STzanio     for (CeedInt i=0; i<Q; i++) {
40*182fbe45STzanio       qd[i] = qw[i] / J[i];
41*182fbe45STzanio     }
42*182fbe45STzanio     break;
43*182fbe45STzanio   case 22:
44*182fbe45STzanio     for (CeedInt i=0; i<Q; i++) {
45*182fbe45STzanio       // J: 0 2   qd: 0 1   adj(J):  J22 -J12
46*182fbe45STzanio       //    1 3       1 2           -J21  J11
47*182fbe45STzanio       const CeedScalar J11 = J[i+Q*0];
48*182fbe45STzanio       const CeedScalar J21 = J[i+Q*1];
49*182fbe45STzanio       const CeedScalar J12 = J[i+Q*2];
50*182fbe45STzanio       const CeedScalar J22 = J[i+Q*3];
51*182fbe45STzanio       const CeedScalar w = qw[i] / (J11*J22 - J21*J12);
52*182fbe45STzanio       qd[i+Q*0] =   w * (J12*J12 + J22*J22);
53*182fbe45STzanio       qd[i+Q*1] = - w * (J11*J12 + J21*J22);
54*182fbe45STzanio       qd[i+Q*2] =   w * (J11*J11 + J21*J21);
55*182fbe45STzanio     }
56*182fbe45STzanio     break;
57*182fbe45STzanio   case 33:
58*182fbe45STzanio     for (CeedInt i=0; i<Q; i++) {
59*182fbe45STzanio       // J: 0 3 6   qd: 0 1 2
60*182fbe45STzanio       //    1 4 7       1 3 4
61*182fbe45STzanio       //    2 5 8       2 4 5
62*182fbe45STzanio       const CeedScalar J11 = J[i+Q*0];
63*182fbe45STzanio       const CeedScalar J21 = J[i+Q*1];
64*182fbe45STzanio       const CeedScalar J31 = J[i+Q*2];
65*182fbe45STzanio       const CeedScalar J12 = J[i+Q*3];
66*182fbe45STzanio       const CeedScalar J22 = J[i+Q*4];
67*182fbe45STzanio       const CeedScalar J32 = J[i+Q*5];
68*182fbe45STzanio       const CeedScalar J13 = J[i+Q*6];
69*182fbe45STzanio       const CeedScalar J23 = J[i+Q*7];
70*182fbe45STzanio       const CeedScalar J33 = J[i+Q*8];
71*182fbe45STzanio       const CeedScalar A11 = J22*J33 - J23*J32;
72*182fbe45STzanio       const CeedScalar A12 = J13*J32 - J12*J33;
73*182fbe45STzanio       const CeedScalar A13 = J12*J23 - J13*J22;
74*182fbe45STzanio       const CeedScalar A21 = J23*J31 - J21*J33;
75*182fbe45STzanio       const CeedScalar A22 = J11*J33 - J13*J31;
76*182fbe45STzanio       const CeedScalar A23 = J13*J21 - J11*J23;
77*182fbe45STzanio       const CeedScalar A31 = J21*J32 - J22*J31;
78*182fbe45STzanio       const CeedScalar A32 = J12*J31 - J11*J32;
79*182fbe45STzanio       const CeedScalar A33 = J11*J22 - J12*J21;
80*182fbe45STzanio       const CeedScalar w = qw[i] / (J11*A11 + J21*A12 + J31*A13);
81*182fbe45STzanio       qd[i+Q*0] = w * (A11*A11 + A12*A12 + A13*A13);
82*182fbe45STzanio       qd[i+Q*1] = w * (A11*A21 + A12*A22 + A13*A23);
83*182fbe45STzanio       qd[i+Q*2] = w * (A11*A31 + A12*A32 + A13*A33);
84*182fbe45STzanio       qd[i+Q*3] = w * (A21*A21 + A22*A22 + A23*A23);
85*182fbe45STzanio       qd[i+Q*4] = w * (A21*A31 + A22*A32 + A23*A33);
86*182fbe45STzanio       qd[i+Q*5] = w * (A31*A31 + A32*A32 + A33*A33);
87*182fbe45STzanio     }
88*182fbe45STzanio     break;
89*182fbe45STzanio   default:
90*182fbe45STzanio     return CeedError(NULL, 1, "dim=%d, space_dim=%d is not supported",
91*182fbe45STzanio                      dc->dim, dc->space_dim);
92*182fbe45STzanio   }
93*182fbe45STzanio   return 0;
94*182fbe45STzanio }
95*182fbe45STzanio 
96*182fbe45STzanio /// libCEED Q-function for applying a diff operator
97*182fbe45STzanio static int f_apply_diff(void *ctx, void *qdata, CeedInt Q,
98*182fbe45STzanio                         const CeedScalar *const *u, CeedScalar *const *v) {
99*182fbe45STzanio   DiffContext *dc = (DiffContext*)ctx;
100*182fbe45STzanio   const CeedScalar *qd = (const CeedScalar*)qdata;
101*182fbe45STzanio   // u[1], v[1]: size: (Q x nc x dim) with column-major layout (nc == 1)
102*182fbe45STzanio   const CeedScalar *ug = u[1];
103*182fbe45STzanio   CeedScalar *vg = v[1];
104*182fbe45STzanio   switch (dc->dim) {
105*182fbe45STzanio   case 1:
106*182fbe45STzanio     for (CeedInt i=0; i<Q; i++) {
107*182fbe45STzanio       vg[i] = ug[i] * qd[i];
108*182fbe45STzanio     }
109*182fbe45STzanio     break;
110*182fbe45STzanio   case 2:
111*182fbe45STzanio     for (CeedInt i=0; i<Q; i++) {
112*182fbe45STzanio       const CeedScalar ug0 = ug[i+Q*0];
113*182fbe45STzanio       const CeedScalar ug1 = ug[i+Q*1];
114*182fbe45STzanio       vg[i+Q*0] = qd[i+Q*0]*ug0 + qd[i+Q*1]*ug1;
115*182fbe45STzanio       vg[i+Q*1] = qd[i+Q*1]*ug0 + qd[i+Q*2]*ug1;
116*182fbe45STzanio     }
117*182fbe45STzanio     break;
118*182fbe45STzanio   case 3:
119*182fbe45STzanio     for (CeedInt i=0; i<Q; i++) {
120*182fbe45STzanio       const CeedScalar ug0 = ug[i+Q*0];
121*182fbe45STzanio       const CeedScalar ug1 = ug[i+Q*1];
122*182fbe45STzanio       const CeedScalar ug2 = ug[i+Q*2];
123*182fbe45STzanio       vg[i+Q*0] = qd[i+Q*0]*ug0 + qd[i+Q*1]*ug1 + qd[i+Q*2]*ug2;
124*182fbe45STzanio       vg[i+Q*1] = qd[i+Q*1]*ug0 + qd[i+Q*3]*ug1 + qd[i+Q*4]*ug2;
125*182fbe45STzanio       vg[i+Q*2] = qd[i+Q*2]*ug0 + qd[i+Q*4]*ug1 + qd[i+Q*5]*ug2;
126*182fbe45STzanio     }
127*182fbe45STzanio     break;
128*182fbe45STzanio   default:
129*182fbe45STzanio     return CeedError(NULL, 1, "topo_dim=%d is not supported", dc->dim);
130*182fbe45STzanio   }
131*182fbe45STzanio   return 0;
132*182fbe45STzanio }
133*182fbe45STzanio 
134*182fbe45STzanio /// Wrapper for a diffusion CeedOperator as an mfem::Operator
135*182fbe45STzanio class CeedDiffusionOperator : public mfem::Operator {
136*182fbe45STzanio  protected:
137*182fbe45STzanio   const mfem::FiniteElementSpace *fes;
138*182fbe45STzanio   CeedOperator build_oper, oper;
139*182fbe45STzanio   CeedBasis basis, mesh_basis;
140*182fbe45STzanio   CeedElemRestriction restr, mesh_restr;
141*182fbe45STzanio   CeedQFunction apply_qfunc, build_qfunc;
142*182fbe45STzanio   CeedVector node_coords, qdata;
143*182fbe45STzanio 
144*182fbe45STzanio   DiffContext diff_ctx;
145*182fbe45STzanio 
146*182fbe45STzanio   CeedVector u, v;
147*182fbe45STzanio 
148*182fbe45STzanio   static void FESpace2Ceed(const mfem::FiniteElementSpace *fes,
149*182fbe45STzanio                            const mfem::IntegrationRule &ir,
150*182fbe45STzanio                            Ceed ceed, CeedBasis *basis,
151*182fbe45STzanio                            CeedElemRestriction *restr) {
152*182fbe45STzanio     mfem::Mesh *mesh = fes->GetMesh();
153*182fbe45STzanio     const mfem::FiniteElement *fe = fes->GetFE(0);
154*182fbe45STzanio     const int order = fes->GetOrder(0);
155*182fbe45STzanio     mfem::Array<int> dof_map;
156*182fbe45STzanio     switch (mesh->Dimension()) {
157*182fbe45STzanio     case 1: {
158*182fbe45STzanio       const mfem::H1_SegmentElement *h1_fe =
159*182fbe45STzanio         dynamic_cast<const mfem::H1_SegmentElement*>(fe);
160*182fbe45STzanio       MFEM_VERIFY(h1_fe, "invalid FE");
161*182fbe45STzanio       h1_fe->GetDofMap().Copy(dof_map);
162*182fbe45STzanio       break;
163*182fbe45STzanio     }
164*182fbe45STzanio     case 2: {
165*182fbe45STzanio       const mfem::H1_QuadrilateralElement *h1_fe =
166*182fbe45STzanio         dynamic_cast<const mfem::H1_QuadrilateralElement*>(fe);
167*182fbe45STzanio       MFEM_VERIFY(h1_fe, "invalid FE");
168*182fbe45STzanio       h1_fe->GetDofMap().Copy(dof_map);
169*182fbe45STzanio       break;
170*182fbe45STzanio     }
171*182fbe45STzanio     case 3: {
172*182fbe45STzanio       const mfem::H1_HexahedronElement *h1_fe =
173*182fbe45STzanio         dynamic_cast<const mfem::H1_HexahedronElement*>(fe);
174*182fbe45STzanio       MFEM_VERIFY(h1_fe, "invalid FE");
175*182fbe45STzanio       h1_fe->GetDofMap().Copy(dof_map);
176*182fbe45STzanio       break;
177*182fbe45STzanio     }
178*182fbe45STzanio     }
179*182fbe45STzanio     const mfem::FiniteElement *fe1d =
180*182fbe45STzanio       fes->FEColl()->FiniteElementForGeometry(mfem::Geometry::SEGMENT);
181*182fbe45STzanio     mfem::DenseMatrix shape1d(fe1d->GetDof(), ir.GetNPoints());
182*182fbe45STzanio     mfem::DenseMatrix grad1d(fe1d->GetDof(), ir.GetNPoints());
183*182fbe45STzanio     mfem::Vector qref1d(ir.GetNPoints()), qweight1d(ir.GetNPoints());
184*182fbe45STzanio     mfem::Vector shape_i(shape1d.Height());
185*182fbe45STzanio     mfem::DenseMatrix grad_i(grad1d.Height(), 1);
186*182fbe45STzanio     const mfem::H1_SegmentElement *h1_fe1d =
187*182fbe45STzanio       dynamic_cast<const mfem::H1_SegmentElement*>(fe1d);
188*182fbe45STzanio     MFEM_VERIFY(h1_fe1d, "invalid FE");
189*182fbe45STzanio     const mfem::Array<int> &dof_map_1d = h1_fe1d->GetDofMap();
190*182fbe45STzanio     for (int i = 0; i < ir.GetNPoints(); i++) {
191*182fbe45STzanio       const mfem::IntegrationPoint &ip = ir.IntPoint(i);
192*182fbe45STzanio       qref1d(i) = ip.x;
193*182fbe45STzanio       qweight1d(i) = ip.weight;
194*182fbe45STzanio       fe1d->CalcShape(ip, shape_i);
195*182fbe45STzanio       fe1d->CalcDShape(ip, grad_i);
196*182fbe45STzanio       for (int j = 0; j < shape1d.Height(); j++) {
197*182fbe45STzanio         shape1d(j,i) = shape_i(dof_map_1d[j]);
198*182fbe45STzanio         grad1d(j,i) = grad_i(dof_map_1d[j],0);
199*182fbe45STzanio       }
200*182fbe45STzanio     }
201*182fbe45STzanio     CeedBasisCreateTensorH1(ceed, mesh->Dimension(), fes->GetVDim(), order+1,
202*182fbe45STzanio                             ir.GetNPoints(), shape1d.GetData(),
203*182fbe45STzanio                             grad1d.GetData(), qref1d.GetData(),
204*182fbe45STzanio                             qweight1d.GetData(), basis);
205*182fbe45STzanio 
206*182fbe45STzanio     const mfem::Table &el_dof = fes->GetElementToDofTable();
207*182fbe45STzanio     mfem::Array<int> tp_el_dof(el_dof.Size_of_connections());
208*182fbe45STzanio     for (int i = 0; i < mesh->GetNE(); i++) {
209*182fbe45STzanio       const int el_offset = fe->GetDof()*i;
210*182fbe45STzanio       for (int j = 0; j < fe->GetDof(); j++) {
211*182fbe45STzanio         tp_el_dof[j + el_offset] = el_dof.GetJ()[dof_map[j] + el_offset];
212*182fbe45STzanio       }
213*182fbe45STzanio     }
214*182fbe45STzanio     CeedElemRestrictionCreate(ceed, mesh->GetNE(), fe->GetDof(),
215*182fbe45STzanio                               fes->GetNDofs(), CEED_MEM_HOST, CEED_COPY_VALUES,
216*182fbe45STzanio                               tp_el_dof.GetData(), restr);
217*182fbe45STzanio   }
218*182fbe45STzanio 
219*182fbe45STzanio  public:
220*182fbe45STzanio   /// Constructor. Assumes @a fes is a scalar FE space.
221*182fbe45STzanio   CeedDiffusionOperator(Ceed ceed, const mfem::FiniteElementSpace *fes)
222*182fbe45STzanio     : Operator(fes->GetNDofs()),
223*182fbe45STzanio       fes(fes) {
224*182fbe45STzanio     mfem::Mesh *mesh = fes->GetMesh();
225*182fbe45STzanio     const int order = fes->GetOrder(0);
226*182fbe45STzanio     const int ir_order = 2*(order + 2) - 1; // <-----
227*182fbe45STzanio     const mfem::IntegrationRule &ir =
228*182fbe45STzanio       mfem::IntRules.Get(mfem::Geometry::SEGMENT, ir_order);
229*182fbe45STzanio 
230*182fbe45STzanio     FESpace2Ceed(fes, ir, ceed, &basis, &restr);
231*182fbe45STzanio 
232*182fbe45STzanio     const mfem::FiniteElementSpace *mesh_fes = mesh->GetNodalFESpace();
233*182fbe45STzanio     MFEM_VERIFY(mesh_fes, "the Mesh has no nodal FE space");
234*182fbe45STzanio     FESpace2Ceed(mesh_fes, ir, ceed, &mesh_basis, &mesh_restr);
235*182fbe45STzanio 
236*182fbe45STzanio     CeedVectorCreate(ceed, mesh->GetNodes()->Size(), &node_coords);
237*182fbe45STzanio     CeedVectorSetArray(node_coords, CEED_MEM_HOST, CEED_USE_POINTER,
238*182fbe45STzanio                        mesh->GetNodes()->GetData());
239*182fbe45STzanio 
240*182fbe45STzanio     const int dim = mesh->Dimension();
241*182fbe45STzanio     diff_ctx.dim = dim;
242*182fbe45STzanio     diff_ctx.space_dim = mesh->SpaceDimension();
243*182fbe45STzanio 
244*182fbe45STzanio     const int qsize = dim*(dim+1)/2;
245*182fbe45STzanio     CeedQFunctionCreateInterior(ceed, 1, 1, qsize*sizeof(CeedScalar),
246*182fbe45STzanio                                 (CeedEvalMode)(CEED_EVAL_GRAD|CEED_EVAL_WEIGHT),
247*182fbe45STzanio                                 CEED_EVAL_NONE, f_build_diff,
248*182fbe45STzanio                                 __FILE__":f_build_diff", &build_qfunc);
249*182fbe45STzanio     CeedQFunctionSetContext(build_qfunc, &diff_ctx, sizeof(diff_ctx));
250*182fbe45STzanio     CeedOperatorCreate(ceed, mesh_restr, mesh_basis, build_qfunc, NULL, NULL,
251*182fbe45STzanio                        &build_oper);
252*182fbe45STzanio     CeedOperatorGetQData(build_oper, &qdata);
253*182fbe45STzanio     CeedOperatorApply(build_oper, qdata, node_coords, NULL,
254*182fbe45STzanio                       CEED_REQUEST_IMMEDIATE);
255*182fbe45STzanio 
256*182fbe45STzanio     CeedQFunctionCreateInterior(ceed, 1, 1, qsize*sizeof(CeedScalar),
257*182fbe45STzanio                                 CEED_EVAL_GRAD, CEED_EVAL_GRAD, f_apply_diff,
258*182fbe45STzanio                                 __FILE__":f_apply_diff", &apply_qfunc);
259*182fbe45STzanio     CeedQFunctionSetContext(apply_qfunc, &diff_ctx, sizeof(diff_ctx));
260*182fbe45STzanio     CeedOperatorCreate(ceed, restr, basis, apply_qfunc, NULL, NULL, &oper);
261*182fbe45STzanio 
262*182fbe45STzanio     CeedVectorCreate(ceed, fes->GetNDofs(), &u);
263*182fbe45STzanio     CeedVectorCreate(ceed, fes->GetNDofs(), &v);
264*182fbe45STzanio   }
265*182fbe45STzanio 
266*182fbe45STzanio   /// Destructor
267*182fbe45STzanio   ~CeedDiffusionOperator() {
268*182fbe45STzanio     CeedVectorDestroy(&v);
269*182fbe45STzanio     CeedVectorDestroy(&u);
270*182fbe45STzanio     CeedOperatorDestroy(&oper);
271*182fbe45STzanio     CeedQFunctionDestroy(&apply_qfunc);
272*182fbe45STzanio     // qdata is owned by build_oper
273*182fbe45STzanio     CeedOperatorDestroy(&build_oper);
274*182fbe45STzanio     CeedQFunctionDestroy(&build_qfunc);
275*182fbe45STzanio     CeedVectorDestroy(&node_coords);
276*182fbe45STzanio     CeedElemRestrictionDestroy(&mesh_restr);
277*182fbe45STzanio     CeedBasisDestroy(&mesh_basis);
278*182fbe45STzanio     CeedElemRestrictionDestroy(&restr);
279*182fbe45STzanio     CeedBasisDestroy(&basis);
280*182fbe45STzanio   }
281*182fbe45STzanio 
282*182fbe45STzanio   /// Operator action
283*182fbe45STzanio   virtual void Mult(const mfem::Vector &x, mfem::Vector &y) const {
284*182fbe45STzanio     CeedVectorSetArray(u, CEED_MEM_HOST, CEED_USE_POINTER, x.GetData());
285*182fbe45STzanio     CeedVectorSetArray(v, CEED_MEM_HOST, CEED_USE_POINTER, y.GetData());
286*182fbe45STzanio 
287*182fbe45STzanio     CeedOperatorApply(oper, qdata, u, v, CEED_REQUEST_IMMEDIATE);
288*182fbe45STzanio   }
289*182fbe45STzanio };
290