xref: /libCEED/examples/petsc/qfunctions/bps/bp4.h (revision 9b072555b57804a6f4e0fc2b1ad83be89838f0e5)
1cb32e2e7SValeria Barra // Copyright (c) 2017, Lawrence Livermore National Security, LLC. Produced at
2cb32e2e7SValeria Barra // the Lawrence Livermore National Laboratory. LLNL-CODE-734707. All Rights
3cb32e2e7SValeria Barra // reserved. See files LICENSE and NOTICE for details.
4cb32e2e7SValeria Barra //
5cb32e2e7SValeria Barra // This file is part of CEED, a collection of benchmarks, miniapps, software
6cb32e2e7SValeria Barra // libraries and APIs for efficient high-order finite element and spectral
7cb32e2e7SValeria Barra // element discretizations for exascale applications. For more information and
8cb32e2e7SValeria Barra // source code availability see http://github.com/ceed.
9cb32e2e7SValeria Barra //
10cb32e2e7SValeria Barra // The CEED research is supported by the Exascale Computing Project 17-SC-20-SC,
11cb32e2e7SValeria Barra // a collaborative effort of two U.S. Department of Energy organizations (Office
12cb32e2e7SValeria Barra // of Science and the National Nuclear Security Administration) responsible for
13cb32e2e7SValeria Barra // the planning and preparation of a capable exascale ecosystem, including
14cb32e2e7SValeria Barra // software, applications, hardware, advanced system engineering and early
15cb32e2e7SValeria Barra // testbed platforms, in support of the nation's exascale computing imperative.
16cb32e2e7SValeria Barra 
17cb32e2e7SValeria Barra /// @file
18cb32e2e7SValeria Barra /// libCEED QFunctions for diffusion operator example using PETSc
19cb32e2e7SValeria Barra 
20f6b55d2cSvaleriabarra #ifndef bp4_h
21f6b55d2cSvaleriabarra #define bp4_h
22f6b55d2cSvaleriabarra 
23f6b55d2cSvaleriabarra #ifndef __CUDACC__
24f6b55d2cSvaleriabarra #  include <math.h>
25f6b55d2cSvaleriabarra #endif
26f6b55d2cSvaleriabarra 
27e83e87a5Sjeremylt // -----------------------------------------------------------------------------
2813921685Svaleriabarra // This QFunction sets up the rhs and true solution for the problem
29cb32e2e7SValeria Barra // -----------------------------------------------------------------------------
30cb32e2e7SValeria Barra CEED_QFUNCTION(SetupDiffRhs3)(void *ctx, CeedInt Q,
31cb32e2e7SValeria Barra                               const CeedScalar *const *in,
32cb32e2e7SValeria Barra                               CeedScalar *const *out) {
33cb32e2e7SValeria Barra #ifndef M_PI
34cb32e2e7SValeria Barra #  define M_PI    3.14159265358979323846
35cb32e2e7SValeria Barra #endif
36e83e87a5Sjeremylt   const CeedScalar *x = in[0], *w = in[1];
37cb32e2e7SValeria Barra   CeedScalar *true_soln = out[0], *rhs = out[1];
38cb32e2e7SValeria Barra 
39cb32e2e7SValeria Barra   // Quadrature Point Loop
40cb32e2e7SValeria Barra   CeedPragmaSIMD
41cb32e2e7SValeria Barra   for (CeedInt i=0; i<Q; i++) {
42cb32e2e7SValeria Barra     const CeedScalar c[3] = { 0, 1., 2. };
43cb32e2e7SValeria Barra     const CeedScalar k[3] = { 1., 2., 3. };
44cb32e2e7SValeria Barra 
45cb32e2e7SValeria Barra     // Component 1
46cb32e2e7SValeria Barra     true_soln[i+0*Q] = sin(M_PI*(c[0] + k[0]*x[i+Q*0])) *
47cb32e2e7SValeria Barra                        sin(M_PI*(c[1] + k[1]*x[i+Q*1])) *
48cb32e2e7SValeria Barra                        sin(M_PI*(c[2] + k[2]*x[i+Q*2]));
49cb32e2e7SValeria Barra     // Component 2
5082311801Sjeremylt     true_soln[i+1*Q] = 2 * true_soln[i+0*Q];
51cb32e2e7SValeria Barra     // Component 3
5282311801Sjeremylt     true_soln[i+2*Q] = 3 * true_soln[i+0*Q];
53cb32e2e7SValeria Barra 
54cb32e2e7SValeria Barra     // Component 1
55e83e87a5Sjeremylt     rhs[i+0*Q] = w[i+Q*6] * M_PI*M_PI * (k[0]*k[0] + k[1]*k[1] + k[2]*k[2]) *
56cb32e2e7SValeria Barra                  true_soln[i+0*Q];
57cb32e2e7SValeria Barra     // Component 2
5882311801Sjeremylt     rhs[i+1*Q] = 2 * rhs[i+0*Q];
59cb32e2e7SValeria Barra     // Component 3
6082311801Sjeremylt     rhs[i+2*Q] = 3 * rhs[i+0*Q];
61cb32e2e7SValeria Barra   } // End of Quadrature Point Loop
62cb32e2e7SValeria Barra 
63cb32e2e7SValeria Barra   return 0;
64cb32e2e7SValeria Barra }
65cb32e2e7SValeria Barra 
66e83e87a5Sjeremylt // -----------------------------------------------------------------------------
67ed264d09SValeria Barra // This QFunction applies the diffusion operator for a vector field of 3 components.
68ed264d09SValeria Barra //
69ed264d09SValeria Barra // Inputs:
70ed264d09SValeria Barra //   ug     - Input vector Jacobian at quadrature points
71*9b072555Sjeremylt //   q_data  - Geometric factors
72ed264d09SValeria Barra //
73ed264d09SValeria Barra // Output:
74ed264d09SValeria Barra //   vJ     - Output vector (test functions) Jacobian at quadrature points
75ed264d09SValeria Barra //
76cb32e2e7SValeria Barra // -----------------------------------------------------------------------------
77cb32e2e7SValeria Barra CEED_QFUNCTION(Diff3)(void *ctx, CeedInt Q,
78cb32e2e7SValeria Barra                      const CeedScalar *const *in, CeedScalar *const *out) {
79cb32e2e7SValeria Barra   const CeedScalar *ug = in[0], *qd = in[1];
80cb32e2e7SValeria Barra   CeedScalar *vg = out[0];
81cb32e2e7SValeria Barra 
82cb32e2e7SValeria Barra   // Quadrature Point Loop
83cb32e2e7SValeria Barra   CeedPragmaSIMD
84cb32e2e7SValeria Barra   for (CeedInt i=0; i<Q; i++) {
85cb32e2e7SValeria Barra     // Read spatial derivatives of u components
86cb32e2e7SValeria Barra     const CeedScalar uJ[3][3]         = {{ug[i+(0+0*3)*Q],
87cb32e2e7SValeria Barra                                           ug[i+(0+1*3)*Q],
88cb32e2e7SValeria Barra                                           ug[i+(0+2*3)*Q]},
89cb32e2e7SValeria Barra                                          {ug[i+(1+0*3)*Q],
90cb32e2e7SValeria Barra                                           ug[i+(1+1*3)*Q],
91cb32e2e7SValeria Barra                                           ug[i+(1+2*3)*Q]},
92cb32e2e7SValeria Barra                                          {ug[i+(2+0*3)*Q],
93cb32e2e7SValeria Barra                                           ug[i+(2+1*3)*Q],
94cb32e2e7SValeria Barra                                           ug[i+(2+2*3)*Q]}
95cb32e2e7SValeria Barra                                         };
96*9b072555Sjeremylt     // Read q_data (dXdxdXdx_T symmetric matrix)
97*9b072555Sjeremylt     const CeedScalar dXdxdXdx_T[3][3] = {{qd[i+0*Q],
98cb32e2e7SValeria Barra                                           qd[i+1*Q],
99cb32e2e7SValeria Barra                                           qd[i+2*Q]},
100cb32e2e7SValeria Barra                                          {qd[i+1*Q],
101cb32e2e7SValeria Barra                                           qd[i+3*Q],
102cb32e2e7SValeria Barra                                           qd[i+4*Q]},
103cb32e2e7SValeria Barra                                          {qd[i+2*Q],
104cb32e2e7SValeria Barra                                           qd[i+4*Q],
105cb32e2e7SValeria Barra                                           qd[i+5*Q]}
106cb32e2e7SValeria Barra                                         };
107cb32e2e7SValeria Barra 
108cb32e2e7SValeria Barra     for (int k=0; k<3; k++) // k = component
109cb32e2e7SValeria Barra       for (int j=0; j<3; j++) // j = direction of vg
110*9b072555Sjeremylt         vg[i+(k+j*3)*Q] = (uJ[k][0] * dXdxdXdx_T[0][j] +
111*9b072555Sjeremylt                            uJ[k][1] * dXdxdXdx_T[1][j] +
112*9b072555Sjeremylt                            uJ[k][2] * dXdxdXdx_T[2][j]);
113cb32e2e7SValeria Barra   } // End of Quadrature Point Loop
114cb32e2e7SValeria Barra 
115cb32e2e7SValeria Barra   return 0;
116cb32e2e7SValeria Barra }
117cb32e2e7SValeria Barra // -----------------------------------------------------------------------------
118f6b55d2cSvaleriabarra 
119f6b55d2cSvaleriabarra #endif // bp4_h
120