// Copyright (c) 2017, Lawrence Livermore National Security, LLC. Produced at
// the Lawrence Livermore National Laboratory. LLNL-CODE-734707. All Rights
// reserved. See files LICENSE and NOTICE for details.
//
// This file is part of CEED, a collection of benchmarks, miniapps, software
// libraries and APIs for efficient high-order finite element and spectral
// element discretizations for exascale applications. For more information and
// source code availability see http://github.com/ceed.
//
// The CEED research is supported by the Exascale Computing Project 17-SC-20-SC,
// a collaborative effort of two U.S. Department of Energy organizations (Office
// of Science and the National Nuclear Security Administration) responsible for
// the planning and preparation of a capable exascale ecosystem, including
// software, applications, hardware, advanced system engineering and early
// testbed platforms, in support of the nation's exascale computing imperative.
16*182fbe45STzanio 17*182fbe45STzanio /// @file 18*182fbe45STzanio /// MFEM diffusion operator based on libCEED 19*182fbe45STzanio 20*182fbe45STzanio #include <ceed.h> 21*182fbe45STzanio #include <mfem.hpp> 22*182fbe45STzanio 23*182fbe45STzanio /// A structure used to pass additional data to f_build_diff and f_apply_diff 24*182fbe45STzanio struct DiffContext { CeedInt dim, space_dim; }; 25*182fbe45STzanio 26*182fbe45STzanio /// libCEED Q-function for building quadrature data for a diffusion operator 27*182fbe45STzanio static int f_build_diff(void *ctx, void *qdata, CeedInt Q, 28*182fbe45STzanio const CeedScalar *const *u, CeedScalar *const *v) { 29*182fbe45STzanio // u[1] is Jacobians, size (Q x nc x dim) with column-major layout 30*182fbe45STzanio // u[4] is quadrature weights, size (Q) 31*182fbe45STzanio // 32*182fbe45STzanio // At every quadrature point, compute qw/det(J).adj(J).adj(J)^T and store 33*182fbe45STzanio // the symmetric part of the result. 34*182fbe45STzanio DiffContext *dc = (DiffContext*)ctx; 35*182fbe45STzanio CeedScalar *qd = (CeedScalar*)qdata; 36*182fbe45STzanio const CeedScalar *J = u[1], *qw = u[4]; 37*182fbe45STzanio switch (dc->dim + 10*dc->space_dim) { 38*182fbe45STzanio case 11: 39*182fbe45STzanio for (CeedInt i=0; i<Q; i++) { 40*182fbe45STzanio qd[i] = qw[i] / J[i]; 41*182fbe45STzanio } 42*182fbe45STzanio break; 43*182fbe45STzanio case 22: 44*182fbe45STzanio for (CeedInt i=0; i<Q; i++) { 45*182fbe45STzanio // J: 0 2 qd: 0 1 adj(J): J22 -J12 46*182fbe45STzanio // 1 3 1 2 -J21 J11 47*182fbe45STzanio const CeedScalar J11 = J[i+Q*0]; 48*182fbe45STzanio const CeedScalar J21 = J[i+Q*1]; 49*182fbe45STzanio const CeedScalar J12 = J[i+Q*2]; 50*182fbe45STzanio const CeedScalar J22 = J[i+Q*3]; 51*182fbe45STzanio const CeedScalar w = qw[i] / (J11*J22 - J21*J12); 52*182fbe45STzanio qd[i+Q*0] = w * (J12*J12 + J22*J22); 53*182fbe45STzanio qd[i+Q*1] = - w * (J11*J12 + J21*J22); 54*182fbe45STzanio qd[i+Q*2] = w * (J11*J11 + J21*J21); 55*182fbe45STzanio 
} 56*182fbe45STzanio break; 57*182fbe45STzanio case 33: 58*182fbe45STzanio for (CeedInt i=0; i<Q; i++) { 59*182fbe45STzanio // J: 0 3 6 qd: 0 1 2 60*182fbe45STzanio // 1 4 7 1 3 4 61*182fbe45STzanio // 2 5 8 2 4 5 62*182fbe45STzanio const CeedScalar J11 = J[i+Q*0]; 63*182fbe45STzanio const CeedScalar J21 = J[i+Q*1]; 64*182fbe45STzanio const CeedScalar J31 = J[i+Q*2]; 65*182fbe45STzanio const CeedScalar J12 = J[i+Q*3]; 66*182fbe45STzanio const CeedScalar J22 = J[i+Q*4]; 67*182fbe45STzanio const CeedScalar J32 = J[i+Q*5]; 68*182fbe45STzanio const CeedScalar J13 = J[i+Q*6]; 69*182fbe45STzanio const CeedScalar J23 = J[i+Q*7]; 70*182fbe45STzanio const CeedScalar J33 = J[i+Q*8]; 71*182fbe45STzanio const CeedScalar A11 = J22*J33 - J23*J32; 72*182fbe45STzanio const CeedScalar A12 = J13*J32 - J12*J33; 73*182fbe45STzanio const CeedScalar A13 = J12*J23 - J13*J22; 74*182fbe45STzanio const CeedScalar A21 = J23*J31 - J21*J33; 75*182fbe45STzanio const CeedScalar A22 = J11*J33 - J13*J31; 76*182fbe45STzanio const CeedScalar A23 = J13*J21 - J11*J23; 77*182fbe45STzanio const CeedScalar A31 = J21*J32 - J22*J31; 78*182fbe45STzanio const CeedScalar A32 = J12*J31 - J11*J32; 79*182fbe45STzanio const CeedScalar A33 = J11*J22 - J12*J21; 80*182fbe45STzanio const CeedScalar w = qw[i] / (J11*A11 + J21*A12 + J31*A13); 81*182fbe45STzanio qd[i+Q*0] = w * (A11*A11 + A12*A12 + A13*A13); 82*182fbe45STzanio qd[i+Q*1] = w * (A11*A21 + A12*A22 + A13*A23); 83*182fbe45STzanio qd[i+Q*2] = w * (A11*A31 + A12*A32 + A13*A33); 84*182fbe45STzanio qd[i+Q*3] = w * (A21*A21 + A22*A22 + A23*A23); 85*182fbe45STzanio qd[i+Q*4] = w * (A21*A31 + A22*A32 + A23*A33); 86*182fbe45STzanio qd[i+Q*5] = w * (A31*A31 + A32*A32 + A33*A33); 87*182fbe45STzanio } 88*182fbe45STzanio break; 89*182fbe45STzanio default: 90*182fbe45STzanio return CeedError(NULL, 1, "dim=%d, space_dim=%d is not supported", 91*182fbe45STzanio dc->dim, dc->space_dim); 92*182fbe45STzanio } 93*182fbe45STzanio return 0; 94*182fbe45STzanio } 
95*182fbe45STzanio 96*182fbe45STzanio /// libCEED Q-function for applying a diff operator 97*182fbe45STzanio static int f_apply_diff(void *ctx, void *qdata, CeedInt Q, 98*182fbe45STzanio const CeedScalar *const *u, CeedScalar *const *v) { 99*182fbe45STzanio DiffContext *dc = (DiffContext*)ctx; 100*182fbe45STzanio const CeedScalar *qd = (const CeedScalar*)qdata; 101*182fbe45STzanio // u[1], v[1]: size: (Q x nc x dim) with column-major layout (nc == 1) 102*182fbe45STzanio const CeedScalar *ug = u[1]; 103*182fbe45STzanio CeedScalar *vg = v[1]; 104*182fbe45STzanio switch (dc->dim) { 105*182fbe45STzanio case 1: 106*182fbe45STzanio for (CeedInt i=0; i<Q; i++) { 107*182fbe45STzanio vg[i] = ug[i] * qd[i]; 108*182fbe45STzanio } 109*182fbe45STzanio break; 110*182fbe45STzanio case 2: 111*182fbe45STzanio for (CeedInt i=0; i<Q; i++) { 112*182fbe45STzanio const CeedScalar ug0 = ug[i+Q*0]; 113*182fbe45STzanio const CeedScalar ug1 = ug[i+Q*1]; 114*182fbe45STzanio vg[i+Q*0] = qd[i+Q*0]*ug0 + qd[i+Q*1]*ug1; 115*182fbe45STzanio vg[i+Q*1] = qd[i+Q*1]*ug0 + qd[i+Q*2]*ug1; 116*182fbe45STzanio } 117*182fbe45STzanio break; 118*182fbe45STzanio case 3: 119*182fbe45STzanio for (CeedInt i=0; i<Q; i++) { 120*182fbe45STzanio const CeedScalar ug0 = ug[i+Q*0]; 121*182fbe45STzanio const CeedScalar ug1 = ug[i+Q*1]; 122*182fbe45STzanio const CeedScalar ug2 = ug[i+Q*2]; 123*182fbe45STzanio vg[i+Q*0] = qd[i+Q*0]*ug0 + qd[i+Q*1]*ug1 + qd[i+Q*2]*ug2; 124*182fbe45STzanio vg[i+Q*1] = qd[i+Q*1]*ug0 + qd[i+Q*3]*ug1 + qd[i+Q*4]*ug2; 125*182fbe45STzanio vg[i+Q*2] = qd[i+Q*2]*ug0 + qd[i+Q*4]*ug1 + qd[i+Q*5]*ug2; 126*182fbe45STzanio } 127*182fbe45STzanio break; 128*182fbe45STzanio default: 129*182fbe45STzanio return CeedError(NULL, 1, "topo_dim=%d is not supported", dc->dim); 130*182fbe45STzanio } 131*182fbe45STzanio return 0; 132*182fbe45STzanio } 133*182fbe45STzanio 134*182fbe45STzanio /// Wrapper for a diffusion CeedOperator as an mfem::Operator 135*182fbe45STzanio class CeedDiffusionOperator : public 
mfem::Operator { 136*182fbe45STzanio protected: 137*182fbe45STzanio const mfem::FiniteElementSpace *fes; 138*182fbe45STzanio CeedOperator build_oper, oper; 139*182fbe45STzanio CeedBasis basis, mesh_basis; 140*182fbe45STzanio CeedElemRestriction restr, mesh_restr; 141*182fbe45STzanio CeedQFunction apply_qfunc, build_qfunc; 142*182fbe45STzanio CeedVector node_coords, qdata; 143*182fbe45STzanio 144*182fbe45STzanio DiffContext diff_ctx; 145*182fbe45STzanio 146*182fbe45STzanio CeedVector u, v; 147*182fbe45STzanio 148*182fbe45STzanio static void FESpace2Ceed(const mfem::FiniteElementSpace *fes, 149*182fbe45STzanio const mfem::IntegrationRule &ir, 150*182fbe45STzanio Ceed ceed, CeedBasis *basis, 151*182fbe45STzanio CeedElemRestriction *restr) { 152*182fbe45STzanio mfem::Mesh *mesh = fes->GetMesh(); 153*182fbe45STzanio const mfem::FiniteElement *fe = fes->GetFE(0); 154*182fbe45STzanio const int order = fes->GetOrder(0); 155*182fbe45STzanio mfem::Array<int> dof_map; 156*182fbe45STzanio switch (mesh->Dimension()) { 157*182fbe45STzanio case 1: { 158*182fbe45STzanio const mfem::H1_SegmentElement *h1_fe = 159*182fbe45STzanio dynamic_cast<const mfem::H1_SegmentElement*>(fe); 160*182fbe45STzanio MFEM_VERIFY(h1_fe, "invalid FE"); 161*182fbe45STzanio h1_fe->GetDofMap().Copy(dof_map); 162*182fbe45STzanio break; 163*182fbe45STzanio } 164*182fbe45STzanio case 2: { 165*182fbe45STzanio const mfem::H1_QuadrilateralElement *h1_fe = 166*182fbe45STzanio dynamic_cast<const mfem::H1_QuadrilateralElement*>(fe); 167*182fbe45STzanio MFEM_VERIFY(h1_fe, "invalid FE"); 168*182fbe45STzanio h1_fe->GetDofMap().Copy(dof_map); 169*182fbe45STzanio break; 170*182fbe45STzanio } 171*182fbe45STzanio case 3: { 172*182fbe45STzanio const mfem::H1_HexahedronElement *h1_fe = 173*182fbe45STzanio dynamic_cast<const mfem::H1_HexahedronElement*>(fe); 174*182fbe45STzanio MFEM_VERIFY(h1_fe, "invalid FE"); 175*182fbe45STzanio h1_fe->GetDofMap().Copy(dof_map); 176*182fbe45STzanio break; 177*182fbe45STzanio } 
178*182fbe45STzanio } 179*182fbe45STzanio const mfem::FiniteElement *fe1d = 180*182fbe45STzanio fes->FEColl()->FiniteElementForGeometry(mfem::Geometry::SEGMENT); 181*182fbe45STzanio mfem::DenseMatrix shape1d(fe1d->GetDof(), ir.GetNPoints()); 182*182fbe45STzanio mfem::DenseMatrix grad1d(fe1d->GetDof(), ir.GetNPoints()); 183*182fbe45STzanio mfem::Vector qref1d(ir.GetNPoints()), qweight1d(ir.GetNPoints()); 184*182fbe45STzanio mfem::Vector shape_i(shape1d.Height()); 185*182fbe45STzanio mfem::DenseMatrix grad_i(grad1d.Height(), 1); 186*182fbe45STzanio const mfem::H1_SegmentElement *h1_fe1d = 187*182fbe45STzanio dynamic_cast<const mfem::H1_SegmentElement*>(fe1d); 188*182fbe45STzanio MFEM_VERIFY(h1_fe1d, "invalid FE"); 189*182fbe45STzanio const mfem::Array<int> &dof_map_1d = h1_fe1d->GetDofMap(); 190*182fbe45STzanio for (int i = 0; i < ir.GetNPoints(); i++) { 191*182fbe45STzanio const mfem::IntegrationPoint &ip = ir.IntPoint(i); 192*182fbe45STzanio qref1d(i) = ip.x; 193*182fbe45STzanio qweight1d(i) = ip.weight; 194*182fbe45STzanio fe1d->CalcShape(ip, shape_i); 195*182fbe45STzanio fe1d->CalcDShape(ip, grad_i); 196*182fbe45STzanio for (int j = 0; j < shape1d.Height(); j++) { 197*182fbe45STzanio shape1d(j,i) = shape_i(dof_map_1d[j]); 198*182fbe45STzanio grad1d(j,i) = grad_i(dof_map_1d[j],0); 199*182fbe45STzanio } 200*182fbe45STzanio } 201*182fbe45STzanio CeedBasisCreateTensorH1(ceed, mesh->Dimension(), fes->GetVDim(), order+1, 202*182fbe45STzanio ir.GetNPoints(), shape1d.GetData(), 203*182fbe45STzanio grad1d.GetData(), qref1d.GetData(), 204*182fbe45STzanio qweight1d.GetData(), basis); 205*182fbe45STzanio 206*182fbe45STzanio const mfem::Table &el_dof = fes->GetElementToDofTable(); 207*182fbe45STzanio mfem::Array<int> tp_el_dof(el_dof.Size_of_connections()); 208*182fbe45STzanio for (int i = 0; i < mesh->GetNE(); i++) { 209*182fbe45STzanio const int el_offset = fe->GetDof()*i; 210*182fbe45STzanio for (int j = 0; j < fe->GetDof(); j++) { 211*182fbe45STzanio tp_el_dof[j + 
el_offset] = el_dof.GetJ()[dof_map[j] + el_offset]; 212*182fbe45STzanio } 213*182fbe45STzanio } 214*182fbe45STzanio CeedElemRestrictionCreate(ceed, mesh->GetNE(), fe->GetDof(), 215*182fbe45STzanio fes->GetNDofs(), CEED_MEM_HOST, CEED_COPY_VALUES, 216*182fbe45STzanio tp_el_dof.GetData(), restr); 217*182fbe45STzanio } 218*182fbe45STzanio 219*182fbe45STzanio public: 220*182fbe45STzanio /// Constructor. Assumes @a fes is a scalar FE space. 221*182fbe45STzanio CeedDiffusionOperator(Ceed ceed, const mfem::FiniteElementSpace *fes) 222*182fbe45STzanio : Operator(fes->GetNDofs()), 223*182fbe45STzanio fes(fes) { 224*182fbe45STzanio mfem::Mesh *mesh = fes->GetMesh(); 225*182fbe45STzanio const int order = fes->GetOrder(0); 226*182fbe45STzanio const int ir_order = 2*(order + 2) - 1; // <----- 227*182fbe45STzanio const mfem::IntegrationRule &ir = 228*182fbe45STzanio mfem::IntRules.Get(mfem::Geometry::SEGMENT, ir_order); 229*182fbe45STzanio 230*182fbe45STzanio FESpace2Ceed(fes, ir, ceed, &basis, &restr); 231*182fbe45STzanio 232*182fbe45STzanio const mfem::FiniteElementSpace *mesh_fes = mesh->GetNodalFESpace(); 233*182fbe45STzanio MFEM_VERIFY(mesh_fes, "the Mesh has no nodal FE space"); 234*182fbe45STzanio FESpace2Ceed(mesh_fes, ir, ceed, &mesh_basis, &mesh_restr); 235*182fbe45STzanio 236*182fbe45STzanio CeedVectorCreate(ceed, mesh->GetNodes()->Size(), &node_coords); 237*182fbe45STzanio CeedVectorSetArray(node_coords, CEED_MEM_HOST, CEED_USE_POINTER, 238*182fbe45STzanio mesh->GetNodes()->GetData()); 239*182fbe45STzanio 240*182fbe45STzanio const int dim = mesh->Dimension(); 241*182fbe45STzanio diff_ctx.dim = dim; 242*182fbe45STzanio diff_ctx.space_dim = mesh->SpaceDimension(); 243*182fbe45STzanio 244*182fbe45STzanio const int qsize = dim*(dim+1)/2; 245*182fbe45STzanio CeedQFunctionCreateInterior(ceed, 1, 1, qsize*sizeof(CeedScalar), 246*182fbe45STzanio (CeedEvalMode)(CEED_EVAL_GRAD|CEED_EVAL_WEIGHT), 247*182fbe45STzanio CEED_EVAL_NONE, f_build_diff, 248*182fbe45STzanio 
__FILE__":f_build_diff", &build_qfunc); 249*182fbe45STzanio CeedQFunctionSetContext(build_qfunc, &diff_ctx, sizeof(diff_ctx)); 250*182fbe45STzanio CeedOperatorCreate(ceed, mesh_restr, mesh_basis, build_qfunc, NULL, NULL, 251*182fbe45STzanio &build_oper); 252*182fbe45STzanio CeedOperatorGetQData(build_oper, &qdata); 253*182fbe45STzanio CeedOperatorApply(build_oper, qdata, node_coords, NULL, 254*182fbe45STzanio CEED_REQUEST_IMMEDIATE); 255*182fbe45STzanio 256*182fbe45STzanio CeedQFunctionCreateInterior(ceed, 1, 1, qsize*sizeof(CeedScalar), 257*182fbe45STzanio CEED_EVAL_GRAD, CEED_EVAL_GRAD, f_apply_diff, 258*182fbe45STzanio __FILE__":f_apply_diff", &apply_qfunc); 259*182fbe45STzanio CeedQFunctionSetContext(apply_qfunc, &diff_ctx, sizeof(diff_ctx)); 260*182fbe45STzanio CeedOperatorCreate(ceed, restr, basis, apply_qfunc, NULL, NULL, &oper); 261*182fbe45STzanio 262*182fbe45STzanio CeedVectorCreate(ceed, fes->GetNDofs(), &u); 263*182fbe45STzanio CeedVectorCreate(ceed, fes->GetNDofs(), &v); 264*182fbe45STzanio } 265*182fbe45STzanio 266*182fbe45STzanio /// Destructor 267*182fbe45STzanio ~CeedDiffusionOperator() { 268*182fbe45STzanio CeedVectorDestroy(&v); 269*182fbe45STzanio CeedVectorDestroy(&u); 270*182fbe45STzanio CeedOperatorDestroy(&oper); 271*182fbe45STzanio CeedQFunctionDestroy(&apply_qfunc); 272*182fbe45STzanio // qdata is owned by build_oper 273*182fbe45STzanio CeedOperatorDestroy(&build_oper); 274*182fbe45STzanio CeedQFunctionDestroy(&build_qfunc); 275*182fbe45STzanio CeedVectorDestroy(&node_coords); 276*182fbe45STzanio CeedElemRestrictionDestroy(&mesh_restr); 277*182fbe45STzanio CeedBasisDestroy(&mesh_basis); 278*182fbe45STzanio CeedElemRestrictionDestroy(&restr); 279*182fbe45STzanio CeedBasisDestroy(&basis); 280*182fbe45STzanio } 281*182fbe45STzanio 282*182fbe45STzanio /// Operator action 283*182fbe45STzanio virtual void Mult(const mfem::Vector &x, mfem::Vector &y) const { 284*182fbe45STzanio CeedVectorSetArray(u, CEED_MEM_HOST, CEED_USE_POINTER, x.GetData()); 
285*182fbe45STzanio CeedVectorSetArray(v, CEED_MEM_HOST, CEED_USE_POINTER, y.GetData()); 286*182fbe45STzanio 287*182fbe45STzanio CeedOperatorApply(oper, qdata, u, v, CEED_REQUEST_IMMEDIATE); 288*182fbe45STzanio } 289*182fbe45STzanio }; 290