xref: /honee/qfunctions/utils.h (revision d8667e38623468ed8757e29a58df3cbc3502b3ab)
1ae2b091fSJames Wright // SPDX-FileCopyrightText: Copyright (c) 2017-2024, HONEE contributors.
2ae2b091fSJames Wright // SPDX-License-Identifier: Apache-2.0 OR BSD-2-Clause
3c7ece6efSJeremy L Thompson #pragma once
4704b8bbeSJames Wright 
53e17a7a1SJames Wright #include <ceed/types.h>
63e17a7a1SJames Wright #ifndef CEED_RUNNING_JIT_PASS
7d0cce58aSJeremy L Thompson #include <math.h>
83e17a7a1SJames Wright #endif
9704b8bbeSJames Wright 
10704b8bbeSJames Wright #ifndef M_PI
11704b8bbeSJames Wright #define M_PI 3.14159265358979323846
12704b8bbeSJames Wright #endif
13704b8bbeSJames Wright 
14704b8bbeSJames Wright CEED_QFUNCTION_HELPER CeedScalar Max(CeedScalar a, CeedScalar b) { return a < b ? b : a; }
15704b8bbeSJames Wright CEED_QFUNCTION_HELPER CeedScalar Min(CeedScalar a, CeedScalar b) { return a < b ? a : b; }
16704b8bbeSJames Wright 
17bfa7851aSJames Wright CEED_QFUNCTION_HELPER void SwapScalar(CeedScalar *a, CeedScalar *b) {
18bfa7851aSJames Wright   CeedScalar temp = *a;
19bfa7851aSJames Wright   *a              = *b;
20bfa7851aSJames Wright   *b              = temp;
21bfa7851aSJames Wright }
22bfa7851aSJames Wright 
23704b8bbeSJames Wright CEED_QFUNCTION_HELPER CeedScalar Square(CeedScalar x) { return x * x; }
24704b8bbeSJames Wright CEED_QFUNCTION_HELPER CeedScalar Cube(CeedScalar x) { return x * x * x; }
25704b8bbeSJames Wright 
26e7754af5SKenneth E. Jansen // @brief Scale vector of length N by scalar alpha
27e7754af5SKenneth E. Jansen CEED_QFUNCTION_HELPER void ScaleN(CeedScalar *u, const CeedScalar alpha, const CeedInt N) {
288e5e3595SJames Wright   CeedPragmaSIMD for (CeedInt i = 0; i < N; i++) u[i] *= alpha;
298e5e3595SJames Wright }
308e5e3595SJames Wright 
318e5e3595SJames Wright // @brief Set vector of length N to a value alpha
328e5e3595SJames Wright CEED_QFUNCTION_HELPER void SetValueN(CeedScalar *u, const CeedScalar alpha, const CeedInt N) {
338e5e3595SJames Wright   CeedPragmaSIMD for (CeedInt i = 0; i < N; i++) u[i] = alpha;
348e5e3595SJames Wright }
358e5e3595SJames Wright 
368e5e3595SJames Wright // @brief Copy N elements from x to y
378e5e3595SJames Wright CEED_QFUNCTION_HELPER void CopyN(const CeedScalar *x, CeedScalar *y, const CeedInt N) { CeedPragmaSIMD for (CeedInt i = 0; i < N; i++) y[i] = x[i]; }
388e5e3595SJames Wright 
398e5e3595SJames Wright // @brief Copy 3x3 matrix from A to B
408e5e3595SJames Wright CEED_QFUNCTION_HELPER void CopyMat3(const CeedScalar A[3][3], CeedScalar B[3][3]) { CopyN((const CeedScalar *)A, (CeedScalar *)B, 9); }
418e5e3595SJames Wright 
428e5e3595SJames Wright // @brief Dot product of vectors with N elements
438e5e3595SJames Wright CEED_QFUNCTION_HELPER CeedScalar DotN(const CeedScalar *u, const CeedScalar *v, const CeedInt N) {
448e5e3595SJames Wright   CeedScalar output = 0;
458e5e3595SJames Wright   CeedPragmaSIMD for (CeedInt i = 0; i < N; i++) output += u[i] * v[i];
468e5e3595SJames Wright   return output;
47e7754af5SKenneth E. Jansen }
48e7754af5SKenneth E. Jansen 
49704b8bbeSJames Wright // @brief Dot product of 3 element vectors
508fff8293SJames Wright CEED_QFUNCTION_HELPER CeedScalar Dot3(const CeedScalar *u, const CeedScalar *v) { return u[0] * v[0] + u[1] * v[1] + u[2] * v[2]; }
51704b8bbeSJames Wright 
5264667825SJames Wright // @brief \ell^2 norm of 3 element vectors
5364667825SJames Wright CEED_QFUNCTION_HELPER CeedScalar Norm3(const CeedScalar *u) { return sqrt(u[0] * u[0] + u[1] * u[1] + u[2] * u[2]); }
5464667825SJames Wright 
5583c0b726SJames Wright // @brief \ell^2 norm of 2 element vectors
5683c0b726SJames Wright CEED_QFUNCTION_HELPER CeedScalar Norm2(const CeedScalar *u) { return sqrt(u[0] * u[0] + u[1] * u[1]); }
5783c0b726SJames Wright 
588e5e3595SJames Wright // @brief Cross product of vectors with 3 elements
598e5e3595SJames Wright CEED_QFUNCTION_HELPER void Cross3(const CeedScalar u[3], const CeedScalar v[3], CeedScalar w[3]) {
608e5e3595SJames Wright   w[0] = (u[1] * v[2]) - (u[2] * v[1]);
618e5e3595SJames Wright   w[1] = (u[2] * v[0]) - (u[0] * v[2]);
628e5e3595SJames Wright   w[2] = (u[0] * v[1]) - (u[1] * v[0]);
638e5e3595SJames Wright }
648e5e3595SJames Wright 
658e5e3595SJames Wright // @brief Curl of vector given its gradient
668e5e3595SJames Wright CEED_QFUNCTION_HELPER void Curl3(const CeedScalar gradient[3][3], CeedScalar v[3]) {
678e5e3595SJames Wright   v[0] = gradient[2][1] - gradient[1][2];
688e5e3595SJames Wright   v[1] = gradient[0][2] - gradient[2][0];
698e5e3595SJames Wright   v[2] = gradient[1][0] - gradient[0][1];
708e5e3595SJames Wright }
718e5e3595SJames Wright 
728e5e3595SJames Wright // @brief Matrix vector product, b = Ax + b. A is NxM, x is M, b is N
738e5e3595SJames Wright CEED_QFUNCTION_HELPER void MatVecNM(const CeedScalar *A, const CeedScalar *x, const CeedInt N, const CeedInt M, const CeedTransposeMode transpose_A,
748e5e3595SJames Wright                                     CeedScalar *b) {
758e5e3595SJames Wright   switch (transpose_A) {
768e5e3595SJames Wright     case CEED_NOTRANSPOSE:
778e5e3595SJames Wright       CeedPragmaSIMD for (CeedInt i = 0; i < N; i++) b[i] += DotN(&A[i * M], x, M);
788e5e3595SJames Wright       break;
798e5e3595SJames Wright     case CEED_TRANSPOSE:
808e5e3595SJames Wright       CeedPragmaSIMD for (CeedInt i = 0; i < M; i++) { CeedPragmaSIMD for (CeedInt j = 0; j < N; j++) b[i] += A[j * M + i] * x[j]; }
818e5e3595SJames Wright       break;
828e5e3595SJames Wright   }
838e5e3595SJames Wright }
848e5e3595SJames Wright 
858e5e3595SJames Wright // @brief 3x3 Matrix vector product  b = Ax + b.
868e5e3595SJames Wright CEED_QFUNCTION_HELPER void MatVec3(const CeedScalar A[3][3], const CeedScalar x[3], const CeedTransposeMode transpose_A, CeedScalar b[3]) {
878e5e3595SJames Wright   MatVecNM((const CeedScalar *)A, (const CeedScalar *)x, 3, 3, transpose_A, (CeedScalar *)b);
888e5e3595SJames Wright }
898e5e3595SJames Wright 
908e5e3595SJames Wright // @brief Matrix-Matrix product, B = DA + B, where D is diagonal.
918e5e3595SJames Wright // @details A is NxM, D is diagonal NxN, represented by a vector of length N, and B is NxM. Optionally, A may be transposed.
928e5e3595SJames Wright CEED_QFUNCTION_HELPER void MatDiagNM(const CeedScalar *A, const CeedScalar *D, const CeedInt N, const CeedInt M, const CeedTransposeMode transpose_A,
938e5e3595SJames Wright                                      CeedScalar *B) {
948e5e3595SJames Wright   switch (transpose_A) {
958e5e3595SJames Wright     case CEED_NOTRANSPOSE:
968e5e3595SJames Wright       CeedPragmaSIMD for (CeedInt i = 0; i < N; i++) { CeedPragmaSIMD for (CeedInt j = 0; j < M; j++) B[i * M + j] += D[i] * A[i * M + j]; }
978e5e3595SJames Wright       break;
988e5e3595SJames Wright     case CEED_TRANSPOSE:
998e5e3595SJames Wright       CeedPragmaSIMD for (CeedInt i = 0; i < M; i++) { CeedPragmaSIMD for (CeedInt j = 0; j < N; j++) B[i * N + j] += D[i] * A[j * M + i]; }
1008e5e3595SJames Wright       break;
1018e5e3595SJames Wright   }
1028e5e3595SJames Wright }
1038e5e3595SJames Wright 
1048e5e3595SJames Wright // @brief 3x3 Matrix-Matrix product, B = DA + B, where D is diagonal.
1058e5e3595SJames Wright // @details Optionally, A may be transposed.
1068e5e3595SJames Wright CEED_QFUNCTION_HELPER void MatDiag3(const CeedScalar A[3][3], const CeedScalar D[3], const CeedTransposeMode transpose_A, CeedScalar B[3][3]) {
1078e5e3595SJames Wright   MatDiagNM((const CeedScalar *)A, (const CeedScalar *)D, 3, 3, transpose_A, (CeedScalar *)B);
1088e5e3595SJames Wright }
109e975cfccSJames Wright // @brief NxN Matrix-Matrix product, C = AB + C
110e975cfccSJames Wright CEED_QFUNCTION_HELPER void MatMatN(const CeedScalar *A, const CeedScalar *B, const CeedInt N, const CeedTransposeMode transpose_A,
111e975cfccSJames Wright                                    const CeedTransposeMode transpose_B, CeedScalar *C) {
1128e5e3595SJames Wright   switch (transpose_A) {
1138e5e3595SJames Wright     case CEED_NOTRANSPOSE:
1148e5e3595SJames Wright       switch (transpose_B) {
1158e5e3595SJames Wright         case CEED_NOTRANSPOSE:
116e975cfccSJames Wright           CeedPragmaSIMD for (CeedInt i = 0; i < N; i++) {
117e975cfccSJames Wright             CeedPragmaSIMD for (CeedInt j = 0; j < N; j++) {
118e975cfccSJames Wright               CeedPragmaSIMD for (CeedInt k = 0; k < N; k++) C[i * N + j] += A[i * N + k] * B[k * N + j];
119e975cfccSJames Wright             }
1208e5e3595SJames Wright           }
1218e5e3595SJames Wright           break;
1228e5e3595SJames Wright         case CEED_TRANSPOSE:
123e975cfccSJames Wright           CeedPragmaSIMD for (CeedInt i = 0; i < N; i++) {
124e975cfccSJames Wright             CeedPragmaSIMD for (CeedInt j = 0; j < N; j++) {
125e975cfccSJames Wright               CeedPragmaSIMD for (CeedInt k = 0; k < N; k++) C[i * N + j] += A[i * N + k] * B[j * N + k];
126e975cfccSJames Wright             }
1278e5e3595SJames Wright           }
1288e5e3595SJames Wright           break;
1298e5e3595SJames Wright       }
1308e5e3595SJames Wright       break;
1318e5e3595SJames Wright     case CEED_TRANSPOSE:
1328e5e3595SJames Wright       switch (transpose_B) {
1338e5e3595SJames Wright         case CEED_NOTRANSPOSE:
134e975cfccSJames Wright           CeedPragmaSIMD for (CeedInt i = 0; i < N; i++) {
135e975cfccSJames Wright             CeedPragmaSIMD for (CeedInt j = 0; j < N; j++) {
136e975cfccSJames Wright               CeedPragmaSIMD for (CeedInt k = 0; k < N; k++) C[i * N + j] += A[k * N + i] * B[k * N + j];
137e975cfccSJames Wright             }
1388e5e3595SJames Wright           }
1398e5e3595SJames Wright           break;
1408e5e3595SJames Wright         case CEED_TRANSPOSE:
141e975cfccSJames Wright           CeedPragmaSIMD for (CeedInt i = 0; i < N; i++) {
142e975cfccSJames Wright             CeedPragmaSIMD for (CeedInt j = 0; j < N; j++) {
143e975cfccSJames Wright               CeedPragmaSIMD for (CeedInt k = 0; k < N; k++) C[i * N + j] += A[k * N + i] * B[j * N + k];
144e975cfccSJames Wright             }
1458e5e3595SJames Wright           }
1468e5e3595SJames Wright           break;
1478e5e3595SJames Wright       }
1488e5e3595SJames Wright       break;
1498e5e3595SJames Wright   }
1508e5e3595SJames Wright }
1518e5e3595SJames Wright 
152e975cfccSJames Wright // @brief 3x3 Matrix-Matrix product, C = AB + C
153e975cfccSJames Wright CEED_QFUNCTION_HELPER void MatMat3(const CeedScalar A[3][3], const CeedScalar B[3][3], const CeedTransposeMode transpose_A,
154e975cfccSJames Wright                                    const CeedTransposeMode transpose_B, CeedScalar C[3][3]) {
155e975cfccSJames Wright   MatMatN((const CeedScalar *)A, (const CeedScalar *)B, 3, transpose_A, transpose_B, (CeedScalar *)C);
156e975cfccSJames Wright }
157e975cfccSJames Wright 
15806f0a019SJames Wright /**
159*d8667e38SJames Wright  * @brief Calculate inverse of 2x2 matrix
160*d8667e38SJames Wright  *
161*d8667e38SJames Wright  * @param[in]  A        Input matrix
162*d8667e38SJames Wright  * @param[out] detJ_ptr Determinate of A, may be NULL is not desired
163*d8667e38SJames Wright  * @param[out] A_inv    Output matrix inverse
164*d8667e38SJames Wright  */
165*d8667e38SJames Wright CEED_QFUNCTION_HELPER void MatInv2(const CeedScalar A[2][2], CeedScalar A_inv[2][2], CeedScalar *detJ_ptr) {
166*d8667e38SJames Wright   const CeedScalar detJ = A[0][0] * A[1][1] - A[1][0] * A[0][1];
167*d8667e38SJames Wright 
168*d8667e38SJames Wright   A_inv[0][0] = A[1][1] / detJ;
169*d8667e38SJames Wright   A_inv[0][1] = -A[0][1] / detJ;
170*d8667e38SJames Wright   A_inv[1][0] = -A[1][0] / detJ;
171*d8667e38SJames Wright   A_inv[1][1] = A[0][0] / detJ;
172*d8667e38SJames Wright   if (detJ_ptr) *detJ_ptr = detJ;
173*d8667e38SJames Wright }
174*d8667e38SJames Wright 
175*d8667e38SJames Wright /**
176*d8667e38SJames Wright  * @brief Calculate inverse of 3x3 matrix
177*d8667e38SJames Wright  *
178*d8667e38SJames Wright  * @param[in]  A        Input matrix
179*d8667e38SJames Wright  * @param[out] detJ_ptr Determinate of A, may be NULL is not desired
180*d8667e38SJames Wright  * @param[out] A_inv    Output matrix inverse
181*d8667e38SJames Wright  */
182*d8667e38SJames Wright CEED_QFUNCTION_HELPER void MatInv3(const CeedScalar A[3][3], CeedScalar A_inv[3][3], CeedScalar *detJ_ptr) {
183*d8667e38SJames Wright   // Compute Adjugate of dxdX
184*d8667e38SJames Wright   A_inv[0][0] = A[1][1] * A[2][2] - A[1][2] * A[2][1];
185*d8667e38SJames Wright   A_inv[0][1] = A[0][2] * A[2][1] - A[0][1] * A[2][2];
186*d8667e38SJames Wright   A_inv[0][2] = A[0][1] * A[1][2] - A[0][2] * A[1][1];
187*d8667e38SJames Wright   A_inv[1][0] = A[1][2] * A[2][0] - A[1][0] * A[2][2];
188*d8667e38SJames Wright   A_inv[1][1] = A[0][0] * A[2][2] - A[0][2] * A[2][0];
189*d8667e38SJames Wright   A_inv[1][2] = A[0][2] * A[1][0] - A[0][0] * A[1][2];
190*d8667e38SJames Wright   A_inv[2][0] = A[1][0] * A[2][1] - A[1][1] * A[2][0];
191*d8667e38SJames Wright   A_inv[2][1] = A[0][1] * A[2][0] - A[0][0] * A[2][1];
192*d8667e38SJames Wright   A_inv[2][2] = A[0][0] * A[1][1] - A[0][1] * A[1][0];
193*d8667e38SJames Wright 
194*d8667e38SJames Wright   const CeedScalar detJ = A[0][0] * A_inv[0][0] + A[1][0] * A_inv[0][1] + A[2][0] * A_inv[0][2];
195*d8667e38SJames Wright   ScaleN((CeedScalar *)A_inv, 1 / detJ, 9);
196*d8667e38SJames Wright   if (detJ_ptr) *detJ_ptr = detJ;
197*d8667e38SJames Wright }
198*d8667e38SJames Wright 
199*d8667e38SJames Wright /**
20006f0a019SJames Wright   @brief MxN Matrix-Matrix product, C = AB + C
20106f0a019SJames Wright 
20206f0a019SJames Wright   C is NxM, A is NxP, B is PxM
20306f0a019SJames Wright 
20406f0a019SJames Wright   @param[in]  mat_A Row-major matrix `A`
20506f0a019SJames Wright   @param[in]  mat_B Row-major matrix `B`
20606f0a019SJames Wright   @param[out] mat_C Row-major output matrix `C`
20706f0a019SJames Wright   @param[in]  N     Number of rows of `C`
20806f0a019SJames Wright   @param[in]  M     Number of columns of `C`
20906f0a019SJames Wright   @param[in]  P     Number of columns of `A`/rows of `B`
21006f0a019SJames Wright **/
21106f0a019SJames Wright CEED_QFUNCTION_HELPER void MatMatNM(const CeedScalar *mat_A, const CeedScalar *mat_B, CeedScalar *mat_C, CeedInt N, CeedInt M, CeedInt P) {
21206f0a019SJames Wright   for (CeedInt i = 0; i < N; i++) {
21306f0a019SJames Wright     for (CeedInt j = 0; j < M; j++) {
21406f0a019SJames Wright       for (CeedInt k = 0; k < P; k++) mat_C[i * M + j] += mat_A[i * P + k] * mat_B[k * M + j];
21506f0a019SJames Wright     }
21606f0a019SJames Wright   }
21706f0a019SJames Wright }
21806f0a019SJames Wright 
219704b8bbeSJames Wright // @brief Unpack Kelvin-Mandel notation symmetric tensor into full tensor
220704b8bbeSJames Wright CEED_QFUNCTION_HELPER void KMUnpack(const CeedScalar v[6], CeedScalar A[3][3]) {
221704b8bbeSJames Wright   const CeedScalar weight = 1 / sqrt(2.);
222704b8bbeSJames Wright   A[0][0]                 = v[0];
223704b8bbeSJames Wright   A[1][1]                 = v[1];
224704b8bbeSJames Wright   A[2][2]                 = v[2];
225704b8bbeSJames Wright   A[2][1] = A[1][2] = weight * v[3];
226704b8bbeSJames Wright   A[2][0] = A[0][2] = weight * v[4];
227704b8bbeSJames Wright   A[1][0] = A[0][1] = weight * v[5];
228704b8bbeSJames Wright }
229704b8bbeSJames Wright 
2308e5e3595SJames Wright // @brief Pack full tensor into Kelvin-Mandel notation symmetric tensor
2318e5e3595SJames Wright CEED_QFUNCTION_HELPER void KMPack(const CeedScalar A[3][3], CeedScalar v[6]) {
2328e5e3595SJames Wright   const CeedScalar weight = sqrt(2.);
2338e5e3595SJames Wright   v[0]                    = A[0][0];
2348e5e3595SJames Wright   v[1]                    = A[1][1];
2358e5e3595SJames Wright   v[2]                    = A[2][2];
2368e5e3595SJames Wright   v[3]                    = A[2][1] * weight;
2378e5e3595SJames Wright   v[4]                    = A[2][0] * weight;
2388e5e3595SJames Wright   v[5]                    = A[1][0] * weight;
2398e5e3595SJames Wright }
2408e5e3595SJames Wright 
2418e5e3595SJames Wright // @brief Calculate metric tensor from mapping, g_{ij} = xi_{k,i} xi_{k,j} = dXdx^T dXdx
2428e5e3595SJames Wright CEED_QFUNCTION_HELPER void KMMetricTensor(const CeedScalar dXdx[3][3], CeedScalar km_g_ij[6]) {
2438e5e3595SJames Wright   CeedScalar g_ij[3][3] = {{0.}};
2448e5e3595SJames Wright   MatMat3(dXdx, dXdx, CEED_TRANSPOSE, CEED_NOTRANSPOSE, g_ij);
2458e5e3595SJames Wright   KMPack(g_ij, km_g_ij);
2468e5e3595SJames Wright }
2478e5e3595SJames Wright 
248e7754af5SKenneth E. Jansen // @brief Linear ramp evaluation
249e7754af5SKenneth E. Jansen CEED_QFUNCTION_HELPER CeedScalar LinearRampCoefficient(CeedScalar amplitude, CeedScalar length, CeedScalar start, CeedScalar x) {
250e7754af5SKenneth E. Jansen   if (x < start) {
251e7754af5SKenneth E. Jansen     return amplitude;
252e7754af5SKenneth E. Jansen   } else if (x < start + length) {
253e7754af5SKenneth E. Jansen     return amplitude * ((x - start) * (-1 / length) + 1);
254e7754af5SKenneth E. Jansen   } else {
255e7754af5SKenneth E. Jansen     return 0;
256e7754af5SKenneth E. Jansen   }
257e7754af5SKenneth E. Jansen }
258e7754af5SKenneth E. Jansen 
259ade49511SJames Wright /**
260ade49511SJames Wright   @brief Pack stored values at quadrature point
261ade49511SJames Wright 
262ade49511SJames Wright   @param[in]   Q              Number of quadrature points
263ade49511SJames Wright   @param[in]   i              Current quadrature point
264ade49511SJames Wright   @param[in]   start          Starting index to store components
265ade49511SJames Wright   @param[in]   num_comp       Number of components to store
2666764667bSJames Wright   @param[in]   values_at_qpnt Local values for quadrature point i
267ade49511SJames Wright   @param[out]  stored         Stored values
268ade49511SJames Wright 
269ade49511SJames Wright   @return An error code: 0 - success, otherwise - failure
270ade49511SJames Wright **/
2716764667bSJames Wright CEED_QFUNCTION_HELPER int StoredValuesPack(CeedInt Q, CeedInt i, CeedInt start, CeedInt num_comp, const CeedScalar *values_at_qpnt,
2726764667bSJames Wright                                            CeedScalar *stored) {
2736764667bSJames Wright   for (CeedInt j = 0; j < num_comp; j++) stored[(start + j) * Q + i] = values_at_qpnt[j];
274ade49511SJames Wright 
275ade49511SJames Wright   return CEED_ERROR_SUCCESS;
276ade49511SJames Wright }
277ade49511SJames Wright 
278ade49511SJames Wright /**
279ade49511SJames Wright   @brief Unpack stored values at quadrature point
280ade49511SJames Wright 
281ade49511SJames Wright   @param[in]   Q              Number of quadrature points
282ade49511SJames Wright   @param[in]   i              Current quadrature point
283ade49511SJames Wright   @param[in]   start          Starting index to store components
284ade49511SJames Wright   @param[in]   num_comp       Number of components to store
285ade49511SJames Wright   @param[in]   stored         Stored values
2866764667bSJames Wright   @param[out]  values_at_qpnt Local values for quadrature point i
287ade49511SJames Wright 
288ade49511SJames Wright   @return An error code: 0 - success, otherwise - failure
289ade49511SJames Wright **/
2906764667bSJames Wright CEED_QFUNCTION_HELPER int StoredValuesUnpack(CeedInt Q, CeedInt i, CeedInt start, CeedInt num_comp, const CeedScalar *stored,
2916764667bSJames Wright                                              CeedScalar *values_at_qpnt) {
2926764667bSJames Wright   for (CeedInt j = 0; j < num_comp; j++) values_at_qpnt[j] = stored[(start + j) * Q + i];
293ade49511SJames Wright 
294ade49511SJames Wright   return CEED_ERROR_SUCCESS;
295ade49511SJames Wright }
296ade49511SJames Wright 
297ade49511SJames Wright /**
298e1bedf8cSJames Wright   @brief Unpack N-D element q_data at quadrature point
299e1bedf8cSJames Wright 
300e1bedf8cSJames Wright   @param[in]   dim       Dimension of the element
301e1bedf8cSJames Wright   @param[in]   Q         Number of quadrature points
302e1bedf8cSJames Wright   @param[in]   i         Current quadrature point
303e1bedf8cSJames Wright   @param[in]   q_data    Pointer to q_data (generated by `setupgeo.h:Setup`)
304e1bedf8cSJames Wright   @param[out]  wdetJ     Quadrature weight times determinant of the mapping Jacobian, or `NULL`
305e1bedf8cSJames Wright   @param[out]  dXdx      Inverse of the mapping Jacobian (shape [dim][dim]), or `NULL`
306e77831d2SJames Wright 
307e77831d2SJames Wright   @return An error code: 0 - success, otherwise - failure
308e1bedf8cSJames Wright **/
309e77831d2SJames Wright CEED_QFUNCTION_HELPER int QdataUnpack_ND(CeedInt dim, CeedInt Q, CeedInt i, const CeedScalar *q_data, CeedScalar *wdetJ, CeedScalar *dXdx) {
310e1bedf8cSJames Wright   switch (dim) {
311e1bedf8cSJames Wright     case 2:
312e1bedf8cSJames Wright       if (wdetJ) StoredValuesUnpack(Q, i, 0, 1, q_data, wdetJ);
313e1bedf8cSJames Wright       if (dXdx) StoredValuesUnpack(Q, i, 1, 4, q_data, dXdx);
314e1bedf8cSJames Wright       break;
315e1bedf8cSJames Wright     case 3:
316e1bedf8cSJames Wright       if (wdetJ) StoredValuesUnpack(Q, i, 0, 1, q_data, wdetJ);
317e1bedf8cSJames Wright       if (dXdx) StoredValuesUnpack(Q, i, 1, 9, q_data, dXdx);
318e1bedf8cSJames Wright       break;
319e1bedf8cSJames Wright   }
320e77831d2SJames Wright   return CEED_ERROR_SUCCESS;
321e1bedf8cSJames Wright }
322e1bedf8cSJames Wright 
323e1bedf8cSJames Wright /**
324e1bedf8cSJames Wright   @brief Unpack boundary element q_data for N-D problem at quadrature point
325e1bedf8cSJames Wright 
326e77831d2SJames Wright   @param[in]   dim       Dimension of the element
327e1bedf8cSJames Wright   @param[in]   Q         Number of quadrature points
328e1bedf8cSJames Wright   @param[in]   i         Current quadrature point
329e1bedf8cSJames Wright   @param[in]   q_data    Pointer to q_data (generated by `setupgeo.h:SetupBoundary`)
330e1bedf8cSJames Wright   @param[out]  wdetJ     Quadrature weight times determinant of the mapping Jacobian, or `NULL`
331e1bedf8cSJames Wright   @param[out]  dXdx      Inverse of the mapping Jacobian (shape [dim - 1][dim]), or `NULL`
332e1bedf8cSJames Wright   @param[out]  normal    Components of the normal vector (shape [dim]), or `NULL`
333e77831d2SJames Wright 
334e77831d2SJames Wright   @return An error code: 0 - success, otherwise - failure
335e1bedf8cSJames Wright **/
336e77831d2SJames Wright CEED_QFUNCTION_HELPER int QdataBoundaryUnpack_ND(CeedInt dim, CeedInt Q, CeedInt i, const CeedScalar *q_data, CeedScalar *wdetJ, CeedScalar *dXdx,
337e1bedf8cSJames Wright                                                  CeedScalar *normal) {
338e1bedf8cSJames Wright   switch (dim) {
339e1bedf8cSJames Wright     case 2:
340e1bedf8cSJames Wright       if (wdetJ) StoredValuesUnpack(Q, i, 0, 1, q_data, wdetJ);
341e1bedf8cSJames Wright       if (normal) StoredValuesUnpack(Q, i, 1, 2, q_data, normal);
342e1bedf8cSJames Wright       break;
343e1bedf8cSJames Wright     case 3:
344e1bedf8cSJames Wright       if (wdetJ) StoredValuesUnpack(Q, i, 0, 1, q_data, wdetJ);
345e1bedf8cSJames Wright       if (normal) StoredValuesUnpack(Q, i, 1, 3, q_data, normal);
346e1bedf8cSJames Wright       if (dXdx) StoredValuesUnpack(Q, i, 4, 6, q_data, (CeedScalar *)dXdx);
347e1bedf8cSJames Wright       break;
348e1bedf8cSJames Wright   }
349e77831d2SJames Wright   return CEED_ERROR_SUCCESS;
350e1bedf8cSJames Wright }
351e1bedf8cSJames Wright 
352e1bedf8cSJames Wright /**
353da8b59d6SJames Wright   @brief Unpack boundary element q_data for N-D problem at quadrature point
354da8b59d6SJames Wright 
355da8b59d6SJames Wright   @param[in]   dim       Dimension of the element
356da8b59d6SJames Wright   @param[in]   Q         Number of quadrature points
357da8b59d6SJames Wright   @param[in]   i         Current quadrature point
358da8b59d6SJames Wright   @param[in]   q_data    Pointer to q_data (generated by `setupgeo.h:SetupBoundaryGradient`)
359da8b59d6SJames Wright   @param[out]  wdetJ     Quadrature weight times determinant of the mapping Jacobian, or `NULL`
360da8b59d6SJames Wright   @param[out]  dXdx      Inverse of the mapping Jacobian (shape [dim][dim]), or `NULL`
361da8b59d6SJames Wright   @param[out]  normal    Components of the normal vector (shape [dim]), or `NULL`
362da8b59d6SJames Wright 
363da8b59d6SJames Wright   @return An error code: 0 - success, otherwise - failure
364da8b59d6SJames Wright **/
365da8b59d6SJames Wright CEED_QFUNCTION_HELPER int QdataBoundaryGradientUnpack_ND(CeedInt dim, CeedInt Q, CeedInt i, const CeedScalar *q_data, CeedScalar *wdetJ,
366da8b59d6SJames Wright                                                          CeedScalar *dXdx, CeedScalar *normal) {
367da8b59d6SJames Wright   switch (dim) {
368da8b59d6SJames Wright     case 2:
369da8b59d6SJames Wright       if (wdetJ) StoredValuesUnpack(Q, i, 0, 1, q_data, wdetJ);
370da8b59d6SJames Wright       if (dXdx) StoredValuesUnpack(Q, i, 1, 4, q_data, dXdx);
371da8b59d6SJames Wright       if (normal) StoredValuesUnpack(Q, i, 5, 2, q_data, normal);
372da8b59d6SJames Wright       break;
373da8b59d6SJames Wright     case 3:
374da8b59d6SJames Wright       if (wdetJ) StoredValuesUnpack(Q, i, 0, 1, q_data, wdetJ);
375da8b59d6SJames Wright       if (dXdx) StoredValuesUnpack(Q, i, 1, 9, q_data, dXdx);
376da8b59d6SJames Wright       if (normal) StoredValuesUnpack(Q, i, 10, 3, q_data, normal);
377da8b59d6SJames Wright       break;
378da8b59d6SJames Wright   }
379da8b59d6SJames Wright   return CEED_ERROR_SUCCESS;
380da8b59d6SJames Wright }
381da8b59d6SJames Wright 
382da8b59d6SJames Wright /**
383ade49511SJames Wright   @brief Unpack 3D element q_data at quadrature point
384ade49511SJames Wright 
385ade49511SJames Wright   @param[in]   Q         Number of quadrature points
386ade49511SJames Wright   @param[in]   i         Current quadrature point
387ade49511SJames Wright   @param[in]   q_data    Pointer to q_data (generated by `setupgeo.h:Setup`)
388ade49511SJames Wright   @param[out]  wdetJ     Quadrature weight times determinant of the mapping Jacobian
389ade49511SJames Wright   @param[out]  dXdx      Inverse of the mapping Jacobian (shape [3][3])
390ade49511SJames Wright 
391ade49511SJames Wright   @return An error code: 0 - success, otherwise - failure
392ade49511SJames Wright **/
393ade49511SJames Wright CEED_QFUNCTION_HELPER int QdataUnpack_3D(CeedInt Q, CeedInt i, const CeedScalar *q_data, CeedScalar *wdetJ, CeedScalar dXdx[3][3]) {
394e77831d2SJames Wright   return QdataUnpack_ND(3, Q, i, q_data, wdetJ, (CeedScalar *)dXdx);
395ade49511SJames Wright }
396ade49511SJames Wright 
397ade49511SJames Wright /**
398ade49511SJames Wright   @brief Unpack boundary element q_data for 3D problem at quadrature point
399ade49511SJames Wright 
400ade49511SJames Wright   @param[in]   Q         Number of quadrature points
401ade49511SJames Wright   @param[in]   i         Current quadrature point
4022c512a7bSJames Wright   @param[in]   q_data    Pointer to q_data (generated by `setupgeo.h:SetupBoundary`)
403ade49511SJames Wright   @param[out]  wdetJ     Quadrature weight times determinant of the mapping Jacobian, or `NULL`
404ade49511SJames Wright   @param[out]  dXdx      Inverse of the mapping Jacobian (shape [2][3]), or `NULL`
405ade49511SJames Wright   @param[out]  normal    Components of the normal vector (shape [3]), or `NULL`
406ade49511SJames Wright 
407ade49511SJames Wright   @return An error code: 0 - success, otherwise - failure
408ade49511SJames Wright **/
409ade49511SJames Wright CEED_QFUNCTION_HELPER int QdataBoundaryUnpack_3D(CeedInt Q, CeedInt i, const CeedScalar *q_data, CeedScalar *wdetJ, CeedScalar dXdx[2][3],
410ade49511SJames Wright                                                  CeedScalar normal[3]) {
411e77831d2SJames Wright   return QdataBoundaryUnpack_ND(3, Q, i, q_data, wdetJ, (CeedScalar *)dXdx, normal);
412ade49511SJames Wright }
413ade49511SJames Wright 
414baadde1fSJames Wright /**
41515c15616SJames Wright   @brief Unpack boundary element q_data for 3D problem at quadrature point
41615c15616SJames Wright 
41715c15616SJames Wright   @param[in]   Q         Number of quadrature points
41815c15616SJames Wright   @param[in]   i         Current quadrature point
41915c15616SJames Wright   @param[in]   q_data    Pointer to q_data (generated by `setupgeo.h:SetupBoundary`)
42015c15616SJames Wright   @param[out]  wdetJ     Quadrature weight times determinant of the mapping Jacobian, or `NULL`
421e77831d2SJames Wright   @param[out]  dXdx      Inverse of the mapping Jacobian (shape [3][3]), or `NULL`
42215c15616SJames Wright   @param[out]  normal    Components of the normal vector (shape [3]), or `NULL`
42315c15616SJames Wright 
42415c15616SJames Wright   @return An error code: 0 - success, otherwise - failure
42515c15616SJames Wright **/
426e77831d2SJames Wright CEED_QFUNCTION_HELPER int QdataBoundaryGradientUnpack_3D(CeedInt Q, CeedInt i, const CeedScalar *q_data, CeedScalar *wdetJ, CeedScalar dXdx[3][3],
42715c15616SJames Wright                                                          CeedScalar normal[3]) {
428da8b59d6SJames Wright   return QdataBoundaryGradientUnpack_ND(3, Q, i, q_data, wdetJ, (CeedScalar *)dXdx, normal);
42915c15616SJames Wright }
43015c15616SJames Wright 
43115c15616SJames Wright /**
432baadde1fSJames Wright   @brief Unpack 2D element q_data at quadrature point
433baadde1fSJames Wright 
434baadde1fSJames Wright   @param[in]   Q         Number of quadrature points
435baadde1fSJames Wright   @param[in]   i         Current quadrature point
436baadde1fSJames Wright   @param[in]   q_data    Pointer to q_data (generated by `setupgeo.h:Setup`)
437baadde1fSJames Wright   @param[out]  wdetJ     Quadrature weight times determinant of the mapping Jacobian
438baadde1fSJames Wright   @param[out]  dXdx      Inverse of the mapping Jacobian (shape [2][2])
439baadde1fSJames Wright 
440baadde1fSJames Wright   @return An error code: 0 - success, otherwise - failure
441baadde1fSJames Wright **/
442baadde1fSJames Wright CEED_QFUNCTION_HELPER int QdataUnpack_2D(CeedInt Q, CeedInt i, const CeedScalar *q_data, CeedScalar *wdetJ, CeedScalar dXdx[2][2]) {
443e1bedf8cSJames Wright   QdataUnpack_ND(2, Q, i, q_data, wdetJ, (CeedScalar *)dXdx);
444baadde1fSJames Wright   return CEED_ERROR_SUCCESS;
445baadde1fSJames Wright }
446baadde1fSJames Wright 
4472c512a7bSJames Wright /**
4482c512a7bSJames Wright   @brief Unpack boundary element q_data for 2D problem at quadrature point
4492c512a7bSJames Wright 
4502c512a7bSJames Wright   @param[in]   Q         Number of quadrature points
4512c512a7bSJames Wright   @param[in]   i         Current quadrature point
4522c512a7bSJames Wright   @param[in]   q_data    Pointer to q_data (generated by `setupgeo.h:SetupBoundary2d`)
4532c512a7bSJames Wright   @param[out]  wdetJ     Quadrature weight times determinant of the mapping Jacobian, or `NULL`
4542c512a7bSJames Wright   @param[out]  normal    Components of the normal vector (shape [2]), or `NULL`
4552c512a7bSJames Wright 
4562c512a7bSJames Wright   @return An error code: 0 - success, otherwise - failure
4572c512a7bSJames Wright **/
4582c512a7bSJames Wright CEED_QFUNCTION_HELPER int QdataBoundaryUnpack_2D(CeedInt Q, CeedInt i, const CeedScalar *q_data, CeedScalar *wdetJ, CeedScalar normal[2]) {
459e1bedf8cSJames Wright   QdataBoundaryUnpack_ND(3, Q, i, q_data, wdetJ, NULL, normal);
4602c512a7bSJames Wright   return CEED_ERROR_SUCCESS;
4612c512a7bSJames Wright }
46206f0a019SJames Wright 
46306f0a019SJames Wright /**
464da8b59d6SJames Wright   @brief Unpack boundary element q_data for 2D problem at quadrature point
465da8b59d6SJames Wright 
466da8b59d6SJames Wright   @param[in]   Q         Number of quadrature points
467da8b59d6SJames Wright   @param[in]   i         Current quadrature point
468da8b59d6SJames Wright   @param[in]   q_data    Pointer to q_data (generated by `setupgeo.h:SetupBoundary`)
469da8b59d6SJames Wright   @param[out]  wdetJ     Quadrature weight times determinant of the mapping Jacobian, or `NULL`
470da8b59d6SJames Wright   @param[out]  dXdx      Inverse of the mapping Jacobian (shape [2][2]), or `NULL`
471da8b59d6SJames Wright   @param[out]  normal    Components of the normal vector (shape [2]), or `NULL`
472da8b59d6SJames Wright 
473da8b59d6SJames Wright   @return An error code: 0 - success, otherwise - failure
474da8b59d6SJames Wright **/
475da8b59d6SJames Wright CEED_QFUNCTION_HELPER int QdataBoundaryGradientUnpack_2D(CeedInt Q, CeedInt i, const CeedScalar *q_data, CeedScalar *wdetJ, CeedScalar dXdx[2][2],
476da8b59d6SJames Wright                                                          CeedScalar normal[2]) {
477da8b59d6SJames Wright   return QdataBoundaryGradientUnpack_ND(2, Q, i, q_data, wdetJ, (CeedScalar *)dXdx, normal);
478da8b59d6SJames Wright }
479da8b59d6SJames Wright 
480da8b59d6SJames Wright /**
48106f0a019SJames Wright   @brief Unpack `CEED_EVAL_GRAD` QF input into quadrature-point local array
48206f0a019SJames Wright 
48306f0a019SJames Wright   @param[in]  Q          Number of quadrature points
48406f0a019SJames Wright   @param[in]  i          Current quadrature point
48506f0a019SJames Wright   @param[in]  num_comp   Number of components of the input
48606f0a019SJames Wright   @param[in]  dim        Topological dimension of the element (ie. number of derivative terms per component)
48706f0a019SJames Wright   @param[in]  grad       QF gradient input, shape `[dim][num_comp][Q]`
488db7fbcd2SJames Wright   @param[out] grad_local Gradient array at quadrature point Q, shape `[num_comp][dim]`
48906f0a019SJames Wright **/
490db7fbcd2SJames Wright CEED_QFUNCTION_HELPER void GradUnpackN(CeedInt Q, CeedInt i, CeedInt num_comp, CeedInt dim, const CeedScalar *grad, CeedScalar *grad_local) {
49106f0a019SJames Wright   for (CeedInt d = 0; d < dim; d++) {
49206f0a019SJames Wright     for (CeedInt c = 0; c < num_comp; c++) {
493db7fbcd2SJames Wright       grad_local[dim * c + d] = grad[(Q * num_comp) * d + Q * c + i];
49406f0a019SJames Wright     }
49506f0a019SJames Wright   }
49606f0a019SJames Wright }
49706f0a019SJames Wright 
49806f0a019SJames Wright /**
49906f0a019SJames Wright   @brief Unpack `CEED_EVAL_GRAD` QF input into quadrature-point local array for 3D elements
50006f0a019SJames Wright 
50106f0a019SJames Wright   @param[in]  Q          Number of quadrature points
50206f0a019SJames Wright   @param[in]  i          Current quadrature point
50306f0a019SJames Wright   @param[in]  num_comp   Number of components of the input
50483c0b726SJames Wright   @param[in]  grad       QF gradient input, shape `[3][num_comp][Q]`
505db7fbcd2SJames Wright   @param[out] grad_local Gradient array at quadrature point Q, shape `[num_comp][3]`
50606f0a019SJames Wright **/
507db7fbcd2SJames Wright CEED_QFUNCTION_HELPER void GradUnpack3(CeedInt Q, CeedInt i, CeedInt num_comp, const CeedScalar *grad, CeedScalar (*grad_local)[3]) {
508db7fbcd2SJames Wright   GradUnpackN(Q, i, num_comp, 3, grad, (CeedScalar *)grad_local);
50906f0a019SJames Wright }
5108c85b835SJames Wright 
5118c85b835SJames Wright /**
51283c0b726SJames Wright   @brief Unpack `CEED_EVAL_GRAD` QF input into quadrature-point local array for 2D elements
51383c0b726SJames Wright 
51483c0b726SJames Wright   @param[in]  Q          Number of quadrature points
51583c0b726SJames Wright   @param[in]  i          Current quadrature point
51683c0b726SJames Wright   @param[in]  num_comp   Number of components of the input
51783c0b726SJames Wright   @param[in]  grad       QF gradient input, shape `[2][num_comp][Q]`
518db7fbcd2SJames Wright   @param[out] grad_local Gradient array at quadrature point Q, shape `[num_comp][2]`
51983c0b726SJames Wright **/
520db7fbcd2SJames Wright CEED_QFUNCTION_HELPER void GradUnpack2(CeedInt Q, CeedInt i, CeedInt num_comp, const CeedScalar *grad, CeedScalar (*grad_local)[2]) {
521db7fbcd2SJames Wright   GradUnpackN(Q, i, num_comp, 2, grad, (CeedScalar *)grad_local);
52283c0b726SJames Wright }
52383c0b726SJames Wright 
52483c0b726SJames Wright /**
5258c85b835SJames Wright   @brief Calculate divergence from reference gradient
5268c85b835SJames Wright 
5278c85b835SJames Wright   Given gradient array G_{ij} and inverse element mapping X_{ij}, then the divergence is
5288c85b835SJames Wright 
5298c85b835SJames Wright   G_{ij} X{ji}
5308c85b835SJames Wright 
5318c85b835SJames Wright   @param[in]  grad_qn    Gradient array, orientation [vector component][gradient direction]
5328c85b835SJames Wright   @param[in]  dXdx       Inverse of the mapping Jacobian (shape [dim][dim])
5338c85b835SJames Wright   @param[in]  dim        Dimension of the problem
5348c85b835SJames Wright   @param[out] divergence The divergence
5358c85b835SJames Wright **/
5368c85b835SJames Wright CEED_QFUNCTION_HELPER void DivergenceND(const CeedScalar *grad_qn, const CeedScalar *dXdx, const CeedInt dim, CeedScalar *divergence) {
5378c85b835SJames Wright   for (CeedInt i = 0; i < dim; i++) {
5388c85b835SJames Wright     for (CeedInt j = 0; j < dim; j++) {
5398c85b835SJames Wright       *divergence += grad_qn[i * dim + j] * dXdx[j * dim + i];
5408c85b835SJames Wright     }
5418c85b835SJames Wright   }
5428c85b835SJames Wright }
5438c85b835SJames Wright 
5448c85b835SJames Wright /**
5458c85b835SJames Wright   @brief Calculate divergence from reference gradient for 3D problem
5468c85b835SJames Wright 
5478c85b835SJames Wright   Given gradient array G_{ij} and inverse element mapping X_{ij}, then the divergence is
5488c85b835SJames Wright 
5498c85b835SJames Wright   G_{ij} X{ji}
5508c85b835SJames Wright 
5518c85b835SJames Wright   @param[in]  grad_qn    Gradient array, orientation [vector component][gradient direction]
5528c85b835SJames Wright   @param[in]  dXdx       Inverse of the mapping Jacobian (shape [3][3])
5538c85b835SJames Wright   @param[out] divergence The divergence
5548c85b835SJames Wright **/
5558c85b835SJames Wright CEED_QFUNCTION_HELPER void Divergence3D(const CeedScalar grad_qn[3][3], const CeedScalar dXdx[3][3], CeedScalar *divergence) {
5568c85b835SJames Wright   DivergenceND((const CeedScalar *)grad_qn, (const CeedScalar *)dXdx, 3, divergence);
5578c85b835SJames Wright }
558