// Copyright (c) 2017-2018, Lawrence Livermore National Security, LLC.
// Produced at the Lawrence Livermore National Laboratory. LLNL-CODE-734707.
// All Rights reserved. See files LICENSE and NOTICE for details.
//
// This file is part of CEED, a collection of benchmarks, miniapps, software
// libraries and APIs for efficient high-order finite element and spectral
// element discretizations for exascale applications. For more information and
// source code availability see http://github.com/ceed.
//
// The CEED research is supported by the Exascale Computing Project 17-SC-20-SC,
// a collaborative effort of two U.S. Department of Energy organizations (Office
// of Science and the National Nuclear Security Administration) responsible for
// the planning and preparation of a capable exascale ecosystem, including
// software, applications, hardware, advanced system engineering and early
// testbed platforms, in support of the nation's exascale computing imperative.
16*4d537eeaSYohann 17*4d537eeaSYohann 18*4d537eeaSYohann /// A structure used to pass additional data to f_build_diff and f_apply_diff 19*4d537eeaSYohann struct BuildContext { CeedInt dim, space_dim; }; 20*4d537eeaSYohann 21*4d537eeaSYohann /// libCEED Q-function for building quadrature data for a diffusion operator 22*4d537eeaSYohann CEED_QFUNCTION(f_build_diff)(void *ctx, const CeedInt Q, 23*4d537eeaSYohann const CeedScalar *const *in, CeedScalar *const *out) { 24*4d537eeaSYohann BuildContext *bc = (BuildContext *)ctx; 25*4d537eeaSYohann // in[0] is Jacobians with shape [dim, nc=dim, Q] 26*4d537eeaSYohann // in[1] is quadrature weights, size (Q) 27*4d537eeaSYohann // 28*4d537eeaSYohann // At every quadrature point, compute qw/det(J).adj(J).adj(J)^T and store 29*4d537eeaSYohann // the symmetric part of the result. 30*4d537eeaSYohann const CeedScalar *J = in[0], *qw = in[1]; 31*4d537eeaSYohann CeedScalar *qd = out[0]; 32*4d537eeaSYohann switch (bc->dim + 10*bc->space_dim) { 33*4d537eeaSYohann case 11: 34*4d537eeaSYohann for (CeedInt i=0; i<Q; i++) { 35*4d537eeaSYohann qd[i] = qw[i] / J[i]; 36*4d537eeaSYohann } 37*4d537eeaSYohann break; 38*4d537eeaSYohann case 22: 39*4d537eeaSYohann for (CeedInt i=0; i<Q; i++) { 40*4d537eeaSYohann // J: 0 2 qd: 0 1 adj(J): J22 -J12 41*4d537eeaSYohann // 1 3 1 2 -J21 J11 42*4d537eeaSYohann const CeedScalar J11 = J[i+Q*0]; 43*4d537eeaSYohann const CeedScalar J21 = J[i+Q*1]; 44*4d537eeaSYohann const CeedScalar J12 = J[i+Q*2]; 45*4d537eeaSYohann const CeedScalar J22 = J[i+Q*3]; 46*4d537eeaSYohann const CeedScalar w = qw[i] / (J11*J22 - J21*J12); 47*4d537eeaSYohann qd[i+Q*0] = w * (J12*J12 + J22*J22); 48*4d537eeaSYohann qd[i+Q*1] = - w * (J11*J12 + J21*J22); 49*4d537eeaSYohann qd[i+Q*2] = w * (J11*J11 + J21*J21); 50*4d537eeaSYohann } 51*4d537eeaSYohann break; 52*4d537eeaSYohann case 33: 53*4d537eeaSYohann for (CeedInt i=0; i<Q; i++) { 54*4d537eeaSYohann // J: 0 3 6 qd: 0 1 2 55*4d537eeaSYohann // 1 4 7 1 3 4 56*4d537eeaSYohann // 2 5 8 2 
4 5 57*4d537eeaSYohann const CeedScalar J11 = J[i+Q*0]; 58*4d537eeaSYohann const CeedScalar J21 = J[i+Q*1]; 59*4d537eeaSYohann const CeedScalar J31 = J[i+Q*2]; 60*4d537eeaSYohann const CeedScalar J12 = J[i+Q*3]; 61*4d537eeaSYohann const CeedScalar J22 = J[i+Q*4]; 62*4d537eeaSYohann const CeedScalar J32 = J[i+Q*5]; 63*4d537eeaSYohann const CeedScalar J13 = J[i+Q*6]; 64*4d537eeaSYohann const CeedScalar J23 = J[i+Q*7]; 65*4d537eeaSYohann const CeedScalar J33 = J[i+Q*8]; 66*4d537eeaSYohann const CeedScalar A11 = J22*J33 - J23*J32; 67*4d537eeaSYohann const CeedScalar A12 = J13*J32 - J12*J33; 68*4d537eeaSYohann const CeedScalar A13 = J12*J23 - J13*J22; 69*4d537eeaSYohann const CeedScalar A21 = J23*J31 - J21*J33; 70*4d537eeaSYohann const CeedScalar A22 = J11*J33 - J13*J31; 71*4d537eeaSYohann const CeedScalar A23 = J13*J21 - J11*J23; 72*4d537eeaSYohann const CeedScalar A31 = J21*J32 - J22*J31; 73*4d537eeaSYohann const CeedScalar A32 = J12*J31 - J11*J32; 74*4d537eeaSYohann const CeedScalar A33 = J11*J22 - J12*J21; 75*4d537eeaSYohann const CeedScalar w = qw[i] / (J11*A11 + J21*A12 + J31*A13); 76*4d537eeaSYohann qd[i+Q*0] = w * (A11*A11 + A12*A12 + A13*A13); 77*4d537eeaSYohann qd[i+Q*1] = w * (A11*A21 + A12*A22 + A13*A23); 78*4d537eeaSYohann qd[i+Q*2] = w * (A11*A31 + A12*A32 + A13*A33); 79*4d537eeaSYohann qd[i+Q*3] = w * (A21*A21 + A22*A22 + A23*A23); 80*4d537eeaSYohann qd[i+Q*4] = w * (A21*A31 + A22*A32 + A23*A33); 81*4d537eeaSYohann qd[i+Q*5] = w * (A31*A31 + A32*A32 + A33*A33); 82*4d537eeaSYohann } 83*4d537eeaSYohann break; 84*4d537eeaSYohann } 85*4d537eeaSYohann return 0; 86*4d537eeaSYohann } 87*4d537eeaSYohann 88*4d537eeaSYohann /// libCEED Q-function for applying a diff operator 89*4d537eeaSYohann CEED_QFUNCTION(f_apply_diff)(void *ctx, const CeedInt Q, 90*4d537eeaSYohann const CeedScalar *const *in, CeedScalar *const *out) { 91*4d537eeaSYohann BuildContext *bc = (BuildContext *)ctx; 92*4d537eeaSYohann // in[0], out[0] have shape [dim, nc=1, Q] 93*4d537eeaSYohann const 
CeedScalar *ug = in[0], *qd = in[1]; 94*4d537eeaSYohann CeedScalar *vg = out[0]; 95*4d537eeaSYohann switch (bc->dim) { 96*4d537eeaSYohann case 1: 97*4d537eeaSYohann for (CeedInt i=0; i<Q; i++) { 98*4d537eeaSYohann vg[i] = ug[i] * qd[i]; 99*4d537eeaSYohann } 100*4d537eeaSYohann break; 101*4d537eeaSYohann case 2: 102*4d537eeaSYohann for (CeedInt i=0; i<Q; i++) { 103*4d537eeaSYohann const CeedScalar ug0 = ug[i+Q*0]; 104*4d537eeaSYohann const CeedScalar ug1 = ug[i+Q*1]; 105*4d537eeaSYohann vg[i+Q*0] = qd[i+Q*0]*ug0 + qd[i+Q*1]*ug1; 106*4d537eeaSYohann vg[i+Q*1] = qd[i+Q*1]*ug0 + qd[i+Q*2]*ug1; 107*4d537eeaSYohann } 108*4d537eeaSYohann break; 109*4d537eeaSYohann case 3: 110*4d537eeaSYohann for (CeedInt i=0; i<Q; i++) { 111*4d537eeaSYohann const CeedScalar ug0 = ug[i+Q*0]; 112*4d537eeaSYohann const CeedScalar ug1 = ug[i+Q*1]; 113*4d537eeaSYohann const CeedScalar ug2 = ug[i+Q*2]; 114*4d537eeaSYohann vg[i+Q*0] = qd[i+Q*0]*ug0 + qd[i+Q*1]*ug1 + qd[i+Q*2]*ug2; 115*4d537eeaSYohann vg[i+Q*1] = qd[i+Q*1]*ug0 + qd[i+Q*3]*ug1 + qd[i+Q*4]*ug2; 116*4d537eeaSYohann vg[i+Q*2] = qd[i+Q*2]*ug0 + qd[i+Q*4]*ug1 + qd[i+Q*5]*ug2; 117*4d537eeaSYohann } 118*4d537eeaSYohann break; 119*4d537eeaSYohann } 120*4d537eeaSYohann return 0; 121*4d537eeaSYohann } 122