xref: /libCEED/examples/petsc/qfunctions/bps/bp3.h (revision 2b730f8b5a9c809740a0b3b302db43a719c636b1)
13d8e8822SJeremy L Thompson // Copyright (c) 2017-2022, Lawrence Livermore National Security, LLC and other CEED contributors.
23d8e8822SJeremy L Thompson // All Rights Reserved. See the top-level LICENSE and NOTICE files for details.
3cb32e2e7SValeria Barra //
43d8e8822SJeremy L Thompson // SPDX-License-Identifier: BSD-2-Clause
5cb32e2e7SValeria Barra //
63d8e8822SJeremy L Thompson // This file is part of CEED:  http://github.com/ceed
7cb32e2e7SValeria Barra 
8cb32e2e7SValeria Barra /// @file
9cb32e2e7SValeria Barra /// libCEED QFunctions for diffusion operator example using PETSc
10cb32e2e7SValeria Barra 
1113921685Svaleriabarra #ifndef bp3_h
1213921685Svaleriabarra #define bp3_h
1313921685Svaleriabarra 
14c9c2c079SJeremy L Thompson #include <ceed.h>
1513921685Svaleriabarra #include <math.h>
1613921685Svaleriabarra 
17e83e87a5Sjeremylt // -----------------------------------------------------------------------------
18ed264d09SValeria Barra // This QFunction sets up the geometric factors required to apply the
19ed264d09SValeria Barra //   diffusion operator
20ed264d09SValeria Barra //
21ed264d09SValeria Barra // We require the product of the inverse of the Jacobian and its transpose to
22ed264d09SValeria Barra //   properly compute integrals of the form: int( gradv gradu)
23ed264d09SValeria Barra //
24ed264d09SValeria Barra // Determinant of Jacobian:
25ed264d09SValeria Barra //   detJ = J11*A11 + J21*A12 + J31*A13
26ed264d09SValeria Barra //     Jij = Jacobian entry ij
27ed264d09SValeria Barra //     Aij = Adjoint ij
28ed264d09SValeria Barra //
29ed264d09SValeria Barra // Inverse of Jacobian:
30ed264d09SValeria Barra //   Bij = Aij / detJ
31ed264d09SValeria Barra //
32ed264d09SValeria Barra // Product of Inverse and Transpose:
33ed264d09SValeria Barra //   BBij = sum( Bik Bkj )
34ed264d09SValeria Barra //
35ed264d09SValeria Barra // Stored: w B^T B detJ = w A^T A / detJ
36ed264d09SValeria Barra //   Note: This matrix is symmetric, so we only store 6 distinct entries
370a8fc04aSrezgarshakeri //     qd: 1 4 7
38ed264d09SValeria Barra //         2 5 8
390a8fc04aSrezgarshakeri //         3 6 9
40cb32e2e7SValeria Barra // -----------------------------------------------------------------------------
41*2b730f8bSJeremy L Thompson CEED_QFUNCTION(SetupDiffGeo)(void *ctx, CeedInt Q, const CeedScalar *const *in, CeedScalar *const *out) {
42d4d45553Srezgarshakeri   // Inputs
43d4d45553Srezgarshakeri   const CeedScalar(*J)[3][CEED_Q_VLA] = (const CeedScalar(*)[3][CEED_Q_VLA])in[1];
44d4d45553Srezgarshakeri   const CeedScalar(*w)                = in[2];  // Note: *X = in[0]
45d4d45553Srezgarshakeri   // Outputs
46d4d45553Srezgarshakeri   CeedScalar(*qd) = out[0];
47cb32e2e7SValeria Barra 
48d4d45553Srezgarshakeri   const CeedInt dim = 3;
49cb32e2e7SValeria Barra   // Quadrature Point Loop
50*2b730f8bSJeremy L Thompson   CeedPragmaSIMD for (CeedInt i = 0; i < Q; i++) {
51d4d45553Srezgarshakeri     // Setup
52d4d45553Srezgarshakeri     CeedScalar A[3][3];
53d4d45553Srezgarshakeri     for (CeedInt j = 0; j < dim; j++) {
54d4d45553Srezgarshakeri       for (CeedInt k = 0; k < dim; k++) {
55d4d45553Srezgarshakeri         // Equivalent code with no mod operations:
56d4d45553Srezgarshakeri         // A[k][j] = J[k+1][j+1]*J[k+2][j+2] - J[k+1][j+2]*J[k+2][j+1]
57d4d45553Srezgarshakeri         A[k][j] = J[(k + 1) % dim][(j + 1) % dim][i] * J[(k + 2) % dim][(j + 2) % dim][i] -
58d4d45553Srezgarshakeri                   J[(k + 1) % dim][(j + 2) % dim][i] * J[(k + 2) % dim][(j + 1) % dim][i];
59d4d45553Srezgarshakeri       }
60d4d45553Srezgarshakeri     }
61d4d45553Srezgarshakeri     const CeedScalar detJ = J[0][0][i] * A[0][0] + J[0][1][i] * A[0][1] + J[0][2][i] * A[0][2];
62d4d45553Srezgarshakeri 
63d4d45553Srezgarshakeri     const CeedScalar qw = w[i] / detJ;
640a8fc04aSrezgarshakeri     qd[i + Q * 0]       = w[i] * detJ;
650a8fc04aSrezgarshakeri     qd[i + Q * 1]       = qw * (A[0][0] * A[0][0] + A[0][1] * A[0][1] + A[0][2] * A[0][2]);
660a8fc04aSrezgarshakeri     qd[i + Q * 2]       = qw * (A[0][0] * A[1][0] + A[0][1] * A[1][1] + A[0][2] * A[1][2]);
670a8fc04aSrezgarshakeri     qd[i + Q * 3]       = qw * (A[0][0] * A[2][0] + A[0][1] * A[2][1] + A[0][2] * A[2][2]);
680a8fc04aSrezgarshakeri     qd[i + Q * 4]       = qw * (A[1][0] * A[1][0] + A[1][1] * A[1][1] + A[1][2] * A[1][2]);
690a8fc04aSrezgarshakeri     qd[i + Q * 5]       = qw * (A[1][0] * A[2][0] + A[1][1] * A[2][1] + A[1][2] * A[2][2]);
700a8fc04aSrezgarshakeri     qd[i + Q * 6]       = qw * (A[2][0] * A[2][0] + A[2][1] * A[2][1] + A[2][2] * A[2][2]);
71cb32e2e7SValeria Barra   }  // End of Quadrature Point Loop
72cb32e2e7SValeria Barra 
73cb32e2e7SValeria Barra   return 0;
74cb32e2e7SValeria Barra }
75cb32e2e7SValeria Barra 
76e83e87a5Sjeremylt // -----------------------------------------------------------------------------
77ed264d09SValeria Barra // This QFunction sets up the rhs and true solution for the problem
78cb32e2e7SValeria Barra // -----------------------------------------------------------------------------
79*2b730f8bSJeremy L Thompson CEED_QFUNCTION(SetupDiffRhs)(void *ctx, CeedInt Q, const CeedScalar *const *in, CeedScalar *const *out) {
80cb32e2e7SValeria Barra #ifndef M_PI
81cb32e2e7SValeria Barra #define M_PI 3.14159265358979323846
82cb32e2e7SValeria Barra #endif
83e83e87a5Sjeremylt   const CeedScalar *x = in[0], *w = in[1];
84cb32e2e7SValeria Barra   CeedScalar       *true_soln = out[0], *rhs = out[1];
85cb32e2e7SValeria Barra 
86cb32e2e7SValeria Barra   // Quadrature Point Loop
87*2b730f8bSJeremy L Thompson   CeedPragmaSIMD for (CeedInt i = 0; i < Q; i++) {
88cb32e2e7SValeria Barra     const CeedScalar c[3] = {0, 1., 2.};
89cb32e2e7SValeria Barra     const CeedScalar k[3] = {1., 2., 3.};
90cb32e2e7SValeria Barra 
91*2b730f8bSJeremy L Thompson     true_soln[i] = sin(M_PI * (c[0] + k[0] * x[i + Q * 0])) * sin(M_PI * (c[1] + k[1] * x[i + Q * 1])) * sin(M_PI * (c[2] + k[2] * x[i + Q * 2]));
92cb32e2e7SValeria Barra 
93*2b730f8bSJeremy L Thompson     rhs[i] = w[i + Q * 0] * M_PI * M_PI * (k[0] * k[0] + k[1] * k[1] + k[2] * k[2]) * true_soln[i];
94cb32e2e7SValeria Barra   }  // End of Quadrature Point Loop
95cb32e2e7SValeria Barra 
96cb32e2e7SValeria Barra   return 0;
97cb32e2e7SValeria Barra }
98cb32e2e7SValeria Barra 
99e83e87a5Sjeremylt // -----------------------------------------------------------------------------
100ed264d09SValeria Barra // This QFunction applies the diffusion operator for a scalar field.
101ed264d09SValeria Barra //
102ed264d09SValeria Barra // Inputs:
103ed264d09SValeria Barra //   ug     - Input vector gradient at quadrature points
1049b072555Sjeremylt //   q_data  - Geometric factors
105ed264d09SValeria Barra //
106ed264d09SValeria Barra // Output:
107ed264d09SValeria Barra //   vg     - Output vector (test functions) gradient at quadrature points
108ed264d09SValeria Barra //
109cb32e2e7SValeria Barra // -----------------------------------------------------------------------------
110*2b730f8bSJeremy L Thompson CEED_QFUNCTION(Diff)(void *ctx, CeedInt Q, const CeedScalar *const *in, CeedScalar *const *out) {
1119b072555Sjeremylt   const CeedScalar *ug = in[0], *q_data = in[1];
112cb32e2e7SValeria Barra   CeedScalar       *vg = out[0];
113cb32e2e7SValeria Barra 
114cb32e2e7SValeria Barra   // Quadrature Point Loop
115*2b730f8bSJeremy L Thompson   CeedPragmaSIMD for (CeedInt i = 0; i < Q; i++) {
116cb32e2e7SValeria Barra     // Read spatial derivatives of u
117*2b730f8bSJeremy L Thompson     const CeedScalar du[3] = {ug[i + Q * 0], ug[i + Q * 1], ug[i + Q * 2]};
1189b072555Sjeremylt     // Read q_data (dXdxdXdx_T symmetric matrix)
119*2b730f8bSJeremy L Thompson     const CeedScalar dXdxdXdx_T[3][3] = {
120*2b730f8bSJeremy L Thompson         {q_data[i + 1 * Q], q_data[i + 2 * Q], q_data[i + 3 * Q]},
121*2b730f8bSJeremy L Thompson         {q_data[i + 2 * Q], q_data[i + 4 * Q], q_data[i + 5 * Q]},
122*2b730f8bSJeremy L Thompson         {q_data[i + 3 * Q], q_data[i + 5 * Q], q_data[i + 6 * Q]}
123cb32e2e7SValeria Barra     };
124cb32e2e7SValeria Barra 
125*2b730f8bSJeremy L Thompson     for (int j = 0; j < 3; j++) {  // j = direction of vg
126*2b730f8bSJeremy L Thompson       vg[i + j * Q] = (du[0] * dXdxdXdx_T[0][j] + du[1] * dXdxdXdx_T[1][j] + du[2] * dXdxdXdx_T[2][j]);
127*2b730f8bSJeremy L Thompson     }
128cb32e2e7SValeria Barra   }  // End of Quadrature Point Loop
129cb32e2e7SValeria Barra   return 0;
130cb32e2e7SValeria Barra }
131cb32e2e7SValeria Barra // -----------------------------------------------------------------------------
132f6b55d2cSvaleriabarra 
133f6b55d2cSvaleriabarra #endif  // bp3_h
134