xref: /libCEED/examples/nek/bps/bps.h (revision 36d2312c6a9f418dd1dc278db7b470a7527039c0)
14d537eeaSYohann // Copyright (c) 2017-2018, Lawrence Livermore National Security, LLC.
24d537eeaSYohann // Produced at the Lawrence Livermore National Laboratory. LLNL-CODE-734707.
34d537eeaSYohann // All Rights reserved. See files LICENSE and NOTICE for details.
44d537eeaSYohann //
54d537eeaSYohann // This file is part of CEED, a collection of benchmarks, miniapps, software
64d537eeaSYohann // libraries and APIs for efficient high-order finite element and spectral
74d537eeaSYohann // element discretizations for exascale applications. For more information and
84d537eeaSYohann // source code availability see http://github.com/ceed.
94d537eeaSYohann //
104d537eeaSYohann // The CEED research is supported by the Exascale Computing Project 17-SC-20-SC,
114d537eeaSYohann // a collaborative effort of two U.S. Department of Energy organizations (Office
124d537eeaSYohann // of Science and the National Nuclear Security Administration) responsible for
134d537eeaSYohann // the planning and preparation of a capable exascale ecosystem, including
144d537eeaSYohann // software, applications, hardware, advanced system engineering and early
154d537eeaSYohann // testbed platforms, in support of the nation's exascale computing imperative.
164d537eeaSYohann 
17*36d2312cSvaleriabarra #ifndef bps_h
18*36d2312cSvaleriabarra #define bps_h
19*36d2312cSvaleriabarra #include <ceed.h>
20*36d2312cSvaleriabarra 
214d537eeaSYohann #ifndef __CUDACC__
224d537eeaSYohann #  include <math.h>
234d537eeaSYohann #endif
244d537eeaSYohann 
25ccaff030SJeremy L Thompson #ifndef M_PI
26ccaff030SJeremy L Thompson #define M_PI    3.14159265358979323846
27ccaff030SJeremy L Thompson #endif
28ccaff030SJeremy L Thompson 
294d537eeaSYohann // *****************************************************************************
304d537eeaSYohann //   BP 1
314d537eeaSYohann // *****************************************************************************
32ccaff030SJeremy L Thompson CEED_QFUNCTION(masssetupf)(void *ctx, CeedInt Q, const CeedScalar *const *in,
33ccaff030SJeremy L Thompson                            CeedScalar *const *out) {
34a2fa7910SValeria Barra   CeedScalar *qdata = out[0], *rhs = out[1];
354d537eeaSYohann   const CeedScalar *x = in[0];
364d537eeaSYohann   const CeedScalar *J = in[1];
374d537eeaSYohann   const CeedScalar *w = in[2];
38ee07ded2SValeria Barra 
39ee07ded2SValeria Barra   // Quadrature Point Loop
404d537eeaSYohann   for (CeedInt i=0; i<Q; i++) {
414d537eeaSYohann     CeedScalar det = (J[i+Q*0]*(J[i+Q*4]*J[i+Q*8] - J[i+Q*5]*J[i+Q*7]) -
424d537eeaSYohann                       J[i+Q*1]*(J[i+Q*3]*J[i+Q*8] - J[i+Q*5]*J[i+Q*6]) +
434d537eeaSYohann                       J[i+Q*2]*(J[i+Q*3]*J[i+Q*7] - J[i+Q*4]*J[i+Q*6]));
44a2fa7910SValeria Barra     qdata[i] = det * w[i];
45a2fa7910SValeria Barra     rhs[i] = qdata[i] * w[i] *
464d537eeaSYohann              sqrt(x[i]*x[i] + x[i+Q]*x[i+Q] + x[i+2*Q]*x[i+2*Q]);
47ee07ded2SValeria Barra   } // End of Quadrature Point Loop
484d537eeaSYohann   return 0;
494d537eeaSYohann }
504d537eeaSYohann 
51ccaff030SJeremy L Thompson CEED_QFUNCTION int massf(void *ctx, CeedInt Q, const CeedScalar *const *in,
52ccaff030SJeremy L Thompson                          CeedScalar *const *out) {
534d537eeaSYohann   const CeedScalar *u = in[0];
54a2fa7910SValeria Barra   const CeedScalar *qdata = in[1];
554d537eeaSYohann   CeedScalar *v = out[0];
56ee07ded2SValeria Barra 
57ee07ded2SValeria Barra   // Quadrature Point Loop
58ee07ded2SValeria Barra   for (CeedInt i=0; i<Q; i++)
59a2fa7910SValeria Barra     v[i] = qdata[i] * u[i];
60ee07ded2SValeria Barra 
614d537eeaSYohann   return 0;
624d537eeaSYohann }
634d537eeaSYohann // *****************************************************************************
644d537eeaSYohann //   BP 3
654d537eeaSYohann // *****************************************************************************
66ccaff030SJeremy L Thompson CEED_QFUNCTION(diffsetupf)(void *ctx, CeedInt Q, const CeedScalar *const *in,
67ccaff030SJeremy L Thompson                            CeedScalar *const *out) {
684d537eeaSYohann   const CeedScalar *x = in[0];
694d537eeaSYohann   const CeedScalar *J = in[1];
704d537eeaSYohann   const CeedScalar *w = in[2];
71a2fa7910SValeria Barra   CeedScalar *qdata = out[0], *rhs = out[1];
72ee07ded2SValeria Barra 
73ee07ded2SValeria Barra   // Quadrature Point Loop
744d537eeaSYohann   for (CeedInt i=0; i<Q; i++) {
75288c0443SJeremy L Thompson     // Stored in Voigt convention
76288c0443SJeremy L Thompson     // 0 5 4
77288c0443SJeremy L Thompson     // 5 1 3
78288c0443SJeremy L Thompson     // 4 3 2
794d537eeaSYohann     const CeedScalar J11 = J[i+Q*0];
804d537eeaSYohann     const CeedScalar J21 = J[i+Q*1];
814d537eeaSYohann     const CeedScalar J31 = J[i+Q*2];
824d537eeaSYohann     const CeedScalar J12 = J[i+Q*3];
834d537eeaSYohann     const CeedScalar J22 = J[i+Q*4];
844d537eeaSYohann     const CeedScalar J32 = J[i+Q*5];
854d537eeaSYohann     const CeedScalar J13 = J[i+Q*6];
864d537eeaSYohann     const CeedScalar J23 = J[i+Q*7];
874d537eeaSYohann     const CeedScalar J33 = J[i+Q*8];
884d537eeaSYohann     const CeedScalar A11 = J22*J33 - J23*J32;
894d537eeaSYohann     const CeedScalar A12 = J13*J32 - J12*J33;
904d537eeaSYohann     const CeedScalar A13 = J12*J23 - J13*J22;
914d537eeaSYohann     const CeedScalar A21 = J23*J31 - J21*J33;
924d537eeaSYohann     const CeedScalar A22 = J11*J33 - J13*J31;
934d537eeaSYohann     const CeedScalar A23 = J13*J21 - J11*J23;
944d537eeaSYohann     const CeedScalar A31 = J21*J32 - J22*J31;
954d537eeaSYohann     const CeedScalar A32 = J12*J31 - J11*J32;
964d537eeaSYohann     const CeedScalar A33 = J11*J22 - J12*J21;
974d537eeaSYohann     const CeedScalar qw = w[i] / (J11*A11 + J21*A12 + J31*A13);
98a2fa7910SValeria Barra     qdata[i+Q*0] = qw * (A11*A11 + A12*A12 + A13*A13);
99a2fa7910SValeria Barra     qdata[i+Q*1] = qw * (A21*A21 + A22*A22 + A23*A23);
100a2fa7910SValeria Barra     qdata[i+Q*2] = qw * (A31*A31 + A32*A32 + A33*A33);
101a2fa7910SValeria Barra     qdata[i+Q*3] = qw * (A21*A31 + A22*A32 + A23*A33);
102a2fa7910SValeria Barra     qdata[i+Q*4] = qw * (A11*A31 + A12*A32 + A13*A33);
103a2fa7910SValeria Barra     qdata[i+Q*5] = qw * (A11*A21 + A12*A22 + A13*A23);
1044d537eeaSYohann     const CeedScalar c[3] = { 0, 1., 2. };
1054d537eeaSYohann     const CeedScalar k[3] = { 1., 2., 3. };
1064d537eeaSYohann     const CeedScalar rho = w[i] * (J11*A11 + J21*A12 + J31*A13);
1074d537eeaSYohann     rhs[i] = rho * M_PI*M_PI * (k[0]*k[0] + k[1]*k[1] + k[2]*k[2]) *
1084d537eeaSYohann              sin(M_PI*(c[0] + k[0]*x[i+Q*0])) *
1094d537eeaSYohann              sin(M_PI*(c[1] + k[1]*x[i+Q*1])) *
1104d537eeaSYohann              sin(M_PI*(c[2] + k[2]*x[i+Q*2]));
111ee07ded2SValeria Barra   } // End of Quadrature Point Loop
1124d537eeaSYohann   return 0;
1134d537eeaSYohann }
1144d537eeaSYohann 
115ccaff030SJeremy L Thompson CEED_QFUNCTION int diffusionf(void *ctx, CeedInt Q, const CeedScalar *const *in,
116ccaff030SJeremy L Thompson                               CeedScalar *const *out) {
1174d537eeaSYohann   const CeedScalar *ug = in[0];
118a2fa7910SValeria Barra   const CeedScalar *qdata = in[1];
1194d537eeaSYohann   CeedScalar *vg = out[0];
120ee07ded2SValeria Barra 
121ee07ded2SValeria Barra   // Quadrature Point Loop
1224d537eeaSYohann   for (CeedInt i=0; i<Q; i++) {
1234d537eeaSYohann     const CeedScalar ug0 = ug[i+Q*0];
1244d537eeaSYohann     const CeedScalar ug1 = ug[i+Q*1];
1254d537eeaSYohann     const CeedScalar ug2 = ug[i+Q*2];
126a2fa7910SValeria Barra     vg[i+Q*0] = qdata[i+Q*0]*ug0 + qdata[i+Q*5]*ug1 + qdata[i+Q*4]*ug2;
127a2fa7910SValeria Barra     vg[i+Q*1] = qdata[i+Q*5]*ug0 + qdata[i+Q*1]*ug1 + qdata[i+Q*3]*ug2;
128a2fa7910SValeria Barra     vg[i+Q*2] = qdata[i+Q*4]*ug0 + qdata[i+Q*3]*ug1 + qdata[i+Q*2]*ug2;
129ee07ded2SValeria Barra   } // End of Quadrature Point Loop
1304d537eeaSYohann   return 0;
1314d537eeaSYohann }
132*36d2312cSvaleriabarra 
133*36d2312cSvaleriabarra #endif // bps_h
134