xref: /libCEED/examples/fluids/qfunctions/newtonian.h (revision 88626eed6564cd43033d3137230605fb5f962840)
13d8e8822SJeremy L Thompson // Copyright (c) 2017-2022, Lawrence Livermore National Security, LLC and other CEED contributors.
23d8e8822SJeremy L Thompson // All Rights Reserved. See the top-level LICENSE and NOTICE files for details.
388b783a1SJames Wright //
43d8e8822SJeremy L Thompson // SPDX-License-Identifier: BSD-2-Clause
588b783a1SJames Wright //
63d8e8822SJeremy L Thompson // This file is part of CEED:  http://github.com/ceed
788b783a1SJames Wright 
888b783a1SJames Wright /// @file
988b783a1SJames Wright /// Operator for Navier-Stokes example using PETSc
1088b783a1SJames Wright 
1188b783a1SJames Wright 
1288b783a1SJames Wright #ifndef newtonian_h
1388b783a1SJames Wright #define newtonian_h
1488b783a1SJames Wright 
1588b783a1SJames Wright #include <math.h>
1688b783a1SJames Wright #include <ceed.h>
1788b783a1SJames Wright 
1888b783a1SJames Wright #ifndef M_PI
1988b783a1SJames Wright #define M_PI    3.14159265358979323846
2088b783a1SJames Wright #endif
2188b783a1SJames Wright 
2288b783a1SJames Wright #ifndef setup_context_struct
2388b783a1SJames Wright #define setup_context_struct
2488b783a1SJames Wright typedef struct SetupContext_ *SetupContext;
2588b783a1SJames Wright struct SetupContext_ {
2688b783a1SJames Wright   CeedScalar theta0;
2788b783a1SJames Wright   CeedScalar thetaC;
2888b783a1SJames Wright   CeedScalar P0;
2988b783a1SJames Wright   CeedScalar N;
3088b783a1SJames Wright   CeedScalar cv;
3188b783a1SJames Wright   CeedScalar cp;
32*88626eedSJames Wright   CeedScalar g[3];
3388b783a1SJames Wright   CeedScalar rc;
3488b783a1SJames Wright   CeedScalar lx;
3588b783a1SJames Wright   CeedScalar ly;
3688b783a1SJames Wright   CeedScalar lz;
3788b783a1SJames Wright   CeedScalar center[3];
3888b783a1SJames Wright   CeedScalar dc_axis[3];
3988b783a1SJames Wright   CeedScalar wind[3];
4088b783a1SJames Wright   CeedScalar time;
4188b783a1SJames Wright   int wind_type;              // See WindType: 0=ROTATION, 1=TRANSLATION
4288b783a1SJames Wright   int bubble_type;            // See BubbleType: 0=SPHERE, 1=CYLINDER
4388b783a1SJames Wright   int bubble_continuity_type; // See BubbleContinuityType: 0=SMOOTH, 1=BACK_SHARP 2=THICK
4488b783a1SJames Wright };
4588b783a1SJames Wright #endif
4688b783a1SJames Wright 
4788b783a1SJames Wright #ifndef newtonian_context_struct
4888b783a1SJames Wright #define newtonian_context_struct
4988b783a1SJames Wright typedef enum {
5088b783a1SJames Wright   STAB_NONE = 0,
5188b783a1SJames Wright   STAB_SU   = 1, // Streamline Upwind
5288b783a1SJames Wright   STAB_SUPG = 2, // Streamline Upwind Petrov-Galerkin
5388b783a1SJames Wright } StabilizationType;
5488b783a1SJames Wright 
5588b783a1SJames Wright typedef struct NewtonianIdealGasContext_ *NewtonianIdealGasContext;
5688b783a1SJames Wright struct NewtonianIdealGasContext_ {
5788b783a1SJames Wright   CeedScalar lambda;
5888b783a1SJames Wright   CeedScalar mu;
5988b783a1SJames Wright   CeedScalar k;
6088b783a1SJames Wright   CeedScalar cv;
6188b783a1SJames Wright   CeedScalar cp;
62*88626eedSJames Wright   CeedScalar g[3];
6388b783a1SJames Wright   CeedScalar c_tau;
64*88626eedSJames Wright   CeedScalar Ctau_t;
65*88626eedSJames Wright   CeedScalar Ctau_v;
66*88626eedSJames Wright   CeedScalar Ctau_C;
67*88626eedSJames Wright   CeedScalar Ctau_M;
68*88626eedSJames Wright   CeedScalar Ctau_E;
69*88626eedSJames Wright   CeedScalar dt;
7088b783a1SJames Wright   StabilizationType stabilization;
7188b783a1SJames Wright };
7288b783a1SJames Wright #endif
7388b783a1SJames Wright 
7488b783a1SJames Wright // *****************************************************************************
7588b783a1SJames Wright // Helper function for computing flux Jacobian
7688b783a1SJames Wright // *****************************************************************************
7788b783a1SJames Wright CEED_QFUNCTION_HELPER void computeFluxJacobian_NS(CeedScalar dF[3][5][5],
7888b783a1SJames Wright     const CeedScalar rho, const CeedScalar u[3], const CeedScalar E,
79*88626eedSJames Wright     const CeedScalar gamma, const CeedScalar g[3], const CeedScalar x[3]) {
8088b783a1SJames Wright   CeedScalar u_sq = u[0]*u[0] + u[1]*u[1] + u[2]*u[2]; // Velocity square
81*88626eedSJames Wright   CeedScalar e_potential = -(g[0]*x[0] + g[1]*x[1] + g[2]*x[2]);
8288b783a1SJames Wright   for (CeedInt i=0; i<3; i++) { // Jacobian matrices for 3 directions
8388b783a1SJames Wright     for (CeedInt j=0; j<3; j++) { // Rows of each Jacobian matrix
84*88626eedSJames Wright       dF[i][j+1][0] = ((i==j) ? ((gamma-1.)*(u_sq/2. - e_potential)) : 0.) -
85*88626eedSJames Wright                       u[i]*u[j];
8688b783a1SJames Wright       for (CeedInt k=0; k<3; k++) { // Columns of each Jacobian matrix
8788b783a1SJames Wright         dF[i][0][k+1]   = ((i==k) ? 1. : 0.);
8888b783a1SJames Wright         dF[i][j+1][k+1] = ((j==k) ? u[i] : 0.) +
8988b783a1SJames Wright                           ((i==k) ? u[j] : 0.) -
9088b783a1SJames Wright                           ((i==j) ? u[k] : 0.) * (gamma-1.);
9188b783a1SJames Wright         dF[i][4][k+1]   = ((i==k) ? (E*gamma/rho - (gamma-1.)*u_sq/2.) : 0.) -
9288b783a1SJames Wright                           (gamma-1.)*u[i]*u[k];
9388b783a1SJames Wright       }
9488b783a1SJames Wright       dF[i][j+1][4] = ((i==j) ? (gamma-1.) : 0.);
9588b783a1SJames Wright     }
9688b783a1SJames Wright     dF[i][4][0] = u[i] * ((gamma-1.)*u_sq - E*gamma/rho);
9788b783a1SJames Wright     dF[i][4][4] = u[i] * gamma;
9888b783a1SJames Wright   }
9988b783a1SJames Wright }
10088b783a1SJames Wright 
10188b783a1SJames Wright // *****************************************************************************
102*88626eedSJames Wright // Helper function for computing flux Jacobian of Primitive variables
103*88626eedSJames Wright // *****************************************************************************
104*88626eedSJames Wright CEED_QFUNCTION_HELPER void computeFluxJacobian_NSp(CeedScalar dF[3][5][5],
105*88626eedSJames Wright     const CeedScalar rho, const CeedScalar u[3], const CeedScalar E,
106*88626eedSJames Wright     const CeedScalar Rd, const CeedScalar cv) {
107*88626eedSJames Wright   CeedScalar u_sq = u[0]*u[0] + u[1]*u[1] + u[2]*u[2]; // Velocity square
108*88626eedSJames Wright   // TODO Add in gravity's contribution
109*88626eedSJames Wright 
110*88626eedSJames Wright   CeedScalar T    = ( E / rho - u_sq / 2. ) / cv;
111*88626eedSJames Wright   CeedScalar drdT = -rho / T;
112*88626eedSJames Wright   CeedScalar drdP = 1. / ( Rd * T);
113*88626eedSJames Wright   CeedScalar etot =  E / rho ;
114*88626eedSJames Wright   CeedScalar e2p  = drdP * etot + 1. ;
115*88626eedSJames Wright   CeedScalar e3p  = ( E  + rho * Rd * T );
116*88626eedSJames Wright   CeedScalar e4p  = drdT * etot + rho * cv ;
117*88626eedSJames Wright 
118*88626eedSJames Wright   for (CeedInt i=0; i<3; i++) { // Jacobian matrices for 3 directions
119*88626eedSJames Wright     for (CeedInt j=0; j<3; j++) { // j counts F^{m_j}
120*88626eedSJames Wright //        [row][col] of A_i
121*88626eedSJames Wright       dF[i][j+1][0] = drdP * u[i] * u[j] + ((i==j) ? 1. : 0.); // F^{{m_j} wrt p
122*88626eedSJames Wright       for (CeedInt k=0; k<3; k++) { // k counts the wrt vel_k
123*88626eedSJames Wright         // this loop handles middle columns for all 5 rows
124*88626eedSJames Wright         dF[i][0][k+1]   =  ((i==k) ? rho  : 0.);   // F^c wrt vel_k
125*88626eedSJames Wright         dF[i][j+1][k+1] = (((j==k) ? u[i] : 0.) +  // F^m_j wrt u_k
126*88626eedSJames Wright                            ((i==k) ? u[j] : 0.) ) * rho;
127*88626eedSJames Wright         dF[i][4][k+1]   = rho * u[i] * u[k]
128*88626eedSJames Wright                           + ((i==k) ? e3p  : 0.) ; // F^e wrt u_k
129*88626eedSJames Wright       }
130*88626eedSJames Wright       dF[i][j+1][4] = drdT * u[i] * u[j]; // F^{m_j} wrt T
131*88626eedSJames Wright     }
132*88626eedSJames Wright     dF[i][4][0] = u[i] * e2p; // F^e wrt p
133*88626eedSJames Wright     dF[i][4][4] = u[i] * e4p; // F^e wrt T
134*88626eedSJames Wright     dF[i][0][0] = u[i] * drdP; // F^c wrt p
135*88626eedSJames Wright     dF[i][0][4] = u[i] * drdT; // F^c wrt T
136*88626eedSJames Wright   }
137*88626eedSJames Wright }
138*88626eedSJames Wright 
139*88626eedSJames Wright CEED_QFUNCTION_HELPER void PrimitiveToConservative_fwd(const CeedScalar rho,
140*88626eedSJames Wright     const CeedScalar u[3], const CeedScalar E, const CeedScalar Rd,
141*88626eedSJames Wright     const CeedScalar cv, const CeedScalar dY[5], CeedScalar dU[5]) {
142*88626eedSJames Wright   CeedScalar u_sq = u[0]*u[0] + u[1]*u[1] + u[2]*u[2];
143*88626eedSJames Wright   CeedScalar T    = ( E / rho - u_sq / 2. ) / cv;
144*88626eedSJames Wright   CeedScalar drdT = -rho / T;
145*88626eedSJames Wright   CeedScalar drdP = 1. / ( Rd * T);
146*88626eedSJames Wright   dU[0] = drdP * dY[0] + drdT * dY[4];
147*88626eedSJames Wright   CeedScalar de_kinetic = 0;
148*88626eedSJames Wright   for (int i=0; i<3; i++) {
149*88626eedSJames Wright     dU[1+i] = dU[0] * u[i] + rho * dY[1+i];
150*88626eedSJames Wright     de_kinetic += u[i] * dY[1+i];
151*88626eedSJames Wright   }
152*88626eedSJames Wright   dU[4] = rho * cv * dY[4] + dU[0] * cv * T // internal energy: rho * e
153*88626eedSJames Wright           + rho * de_kinetic + .5 * dU[0] * u_sq; // kinetic energy: .5 * rho * |u|^2
154*88626eedSJames Wright }
155*88626eedSJames Wright 
156*88626eedSJames Wright // *****************************************************************************
157*88626eedSJames Wright // Helper function for computing Tau elements (stabilization constant)
158*88626eedSJames Wright //   Model from:
159*88626eedSJames Wright //     PHASTA
160*88626eedSJames Wright //
161*88626eedSJames Wright //   Tau[i] = itau=0 which is diagonal-Shakib (3 values still but not spatial)
162*88626eedSJames Wright //
163*88626eedSJames Wright // Where NOT UPDATED YET
164*88626eedSJames Wright // *****************************************************************************
165*88626eedSJames Wright CEED_QFUNCTION_HELPER void Tau_diagPrim(CeedScalar Tau_d[3],
166*88626eedSJames Wright                                         const CeedScalar dXdx[3][3], const CeedScalar u[3],
167*88626eedSJames Wright                                         const CeedScalar cv, const NewtonianIdealGasContext newt_ctx,
168*88626eedSJames Wright                                         const CeedScalar mu, const CeedScalar dt,
169*88626eedSJames Wright                                         const CeedScalar rho) {
170*88626eedSJames Wright   // Context
171*88626eedSJames Wright   const CeedScalar Ctau_t = newt_ctx->Ctau_t;
172*88626eedSJames Wright   const CeedScalar Ctau_v = newt_ctx->Ctau_v;
173*88626eedSJames Wright   const CeedScalar Ctau_C = newt_ctx->Ctau_C;
174*88626eedSJames Wright   const CeedScalar Ctau_M = newt_ctx->Ctau_M;
175*88626eedSJames Wright   const CeedScalar Ctau_E = newt_ctx->Ctau_E;
176*88626eedSJames Wright   CeedScalar gijd[6];
177*88626eedSJames Wright   CeedScalar tau;
178*88626eedSJames Wright   CeedScalar dts;
179*88626eedSJames Wright   CeedScalar fact;
180*88626eedSJames Wright 
181*88626eedSJames Wright   //*INDENT-OFF*
182*88626eedSJames Wright   gijd[0] =   dXdx[0][0] * dXdx[0][0]
183*88626eedSJames Wright             + dXdx[1][0] * dXdx[1][0]
184*88626eedSJames Wright             + dXdx[2][0] * dXdx[2][0];
185*88626eedSJames Wright 
186*88626eedSJames Wright   gijd[1] =   dXdx[0][0] * dXdx[0][1]
187*88626eedSJames Wright             + dXdx[1][0] * dXdx[1][1]
188*88626eedSJames Wright             + dXdx[2][0] * dXdx[2][1];
189*88626eedSJames Wright 
190*88626eedSJames Wright   gijd[2] =   dXdx[0][1] * dXdx[0][1]
191*88626eedSJames Wright             + dXdx[1][1] * dXdx[1][1]
192*88626eedSJames Wright             + dXdx[2][1] * dXdx[2][1];
193*88626eedSJames Wright 
194*88626eedSJames Wright   gijd[3] =   dXdx[0][0] * dXdx[0][2]
195*88626eedSJames Wright             + dXdx[1][0] * dXdx[1][2]
196*88626eedSJames Wright             + dXdx[2][0] * dXdx[2][2];
197*88626eedSJames Wright 
198*88626eedSJames Wright   gijd[4] =   dXdx[0][1] * dXdx[0][2]
199*88626eedSJames Wright             + dXdx[1][1] * dXdx[1][2]
200*88626eedSJames Wright             + dXdx[2][1] * dXdx[2][2];
201*88626eedSJames Wright 
202*88626eedSJames Wright   gijd[5] =   dXdx[0][2] * dXdx[0][2]
203*88626eedSJames Wright             + dXdx[1][2] * dXdx[1][2]
204*88626eedSJames Wright             + dXdx[2][2] * dXdx[2][2];
205*88626eedSJames Wright   //*INDENT-ON*
206*88626eedSJames Wright 
207*88626eedSJames Wright   dts = Ctau_t / dt ;
208*88626eedSJames Wright 
209*88626eedSJames Wright   tau = rho*rho*((4. * dts * dts)
210*88626eedSJames Wright                  + u[0] * ( u[0] * gijd[0] + 2. * ( u[1] * gijd[1] + u[2] * gijd[3]))
211*88626eedSJames Wright                  + u[1] * ( u[1] * gijd[2] + 2. *   u[2] * gijd[4])
212*88626eedSJames Wright                  + u[2] *   u[2] * gijd[5])
213*88626eedSJames Wright         + Ctau_v* mu * mu *
214*88626eedSJames Wright         (gijd[0]*gijd[0] + gijd[2]*gijd[2] + gijd[5]*gijd[5] +
215*88626eedSJames Wright          + 2. * (gijd[1]*gijd[1] + gijd[3]*gijd[3] + gijd[4]*gijd[4]));
216*88626eedSJames Wright 
217*88626eedSJames Wright   fact=sqrt(tau);
218*88626eedSJames Wright 
219*88626eedSJames Wright   Tau_d[0] = Ctau_C * fact / (rho*(gijd[0] + gijd[2] + gijd[5]))*0.125;
220*88626eedSJames Wright 
221*88626eedSJames Wright   Tau_d[1] = Ctau_M / fact;
222*88626eedSJames Wright   Tau_d[2] = Ctau_E / ( fact * cv );
223*88626eedSJames Wright 
224*88626eedSJames Wright // consider putting back the way I initially had it  Ctau_E * Tau_d[1] /cv
225*88626eedSJames Wright //  to avoid a division if the compiler is smart enough to see that cv IS
226*88626eedSJames Wright // a constant that it could invert once for all elements
227*88626eedSJames Wright // but in that case energy tau is scaled by the product of Ctau_E * Ctau_M
228*88626eedSJames Wright // OR we could absorb cv into Ctau_E but this puts more burden on user to
229*88626eedSJames Wright // know how to change constants with a change of fluid or units.  Same for
230*88626eedSJames Wright // Ctau_v * mu * mu IF AND ONLY IF we don't add viscosity law =f(T)
231*88626eedSJames Wright }
232*88626eedSJames Wright 
233*88626eedSJames Wright // *****************************************************************************
23488b783a1SJames Wright // Helper function for computing Tau elements (stabilization constant)
23588b783a1SJames Wright //   Model from:
23688b783a1SJames Wright //     Stabilized Methods for Compressible Flows, Hughes et al 2010
23788b783a1SJames Wright //
23888b783a1SJames Wright //   Spatial criterion #2 - Tau is a 3x3 diagonal matrix
23988b783a1SJames Wright //   Tau[i] = c_tau h[i] Xi(Pe) / rho(A[i]) (no sum)
24088b783a1SJames Wright //
24188b783a1SJames Wright // Where
24288b783a1SJames Wright //   c_tau     = stabilization constant (0.5 is reported as "optimal")
24388b783a1SJames Wright //   h[i]      = 2 length(dxdX[i])
24488b783a1SJames Wright //   Pe        = Peclet number ( Pe = sqrt(u u) / dot(dXdx,u) diffusivity )
24588b783a1SJames Wright //   Xi(Pe)    = coth Pe - 1. / Pe (1. at large local Peclet number )
24688b783a1SJames Wright //   rho(A[i]) = spectral radius of the convective flux Jacobian i,
24788b783a1SJames Wright //               wave speed in direction i
24888b783a1SJames Wright // *****************************************************************************
24988b783a1SJames Wright CEED_QFUNCTION_HELPER void Tau_spatial(CeedScalar Tau_x[3],
25088b783a1SJames Wright                                        const CeedScalar dXdx[3][3], const CeedScalar u[3],
251*88626eedSJames Wright                                        /* const CeedScalar sound_speed, const CeedScalar c_tau) { */
252*88626eedSJames Wright                                        const CeedScalar sound_speed, const CeedScalar c_tau,
253*88626eedSJames Wright                                        const CeedScalar viscosity) {
254*88626eedSJames Wright   const CeedScalar mag_u_visc = sqrt(u[0]*u[0] +u[1]*u[1] +u[2]*u[2]) /
255*88626eedSJames Wright                                 (2*viscosity);
25688b783a1SJames Wright   for (int i=0; i<3; i++) {
25788b783a1SJames Wright     // length of element in direction i
25888b783a1SJames Wright     CeedScalar h = 2 / sqrt(dXdx[0][i]*dXdx[0][i] + dXdx[1][i]*dXdx[1][i] +
25988b783a1SJames Wright                             dXdx[2][i]*dXdx[2][i]);
260*88626eedSJames Wright     CeedScalar Pe = mag_u_visc*h;
261*88626eedSJames Wright     CeedScalar Xi = 1/tanh(Pe) - 1/Pe;
26288b783a1SJames Wright     // fastest wave in direction i
26388b783a1SJames Wright     CeedScalar fastest_wave = fabs(u[i]) + sound_speed;
264*88626eedSJames Wright     Tau_x[i] = c_tau * h * Xi / fastest_wave;
26588b783a1SJames Wright   }
26688b783a1SJames Wright }
26788b783a1SJames Wright 
26888b783a1SJames Wright // *****************************************************************************
26988b783a1SJames Wright // This QFunction sets a "still" initial condition for generic Newtonian IG problems
27088b783a1SJames Wright // *****************************************************************************
27188b783a1SJames Wright CEED_QFUNCTION(ICsNewtonianIG)(void *ctx, CeedInt Q,
27288b783a1SJames Wright                                const CeedScalar *const *in, CeedScalar *const *out) {
27388b783a1SJames Wright   // Inputs
27488b783a1SJames Wright   const CeedScalar (*X)[CEED_Q_VLA] = (const CeedScalar(*)[CEED_Q_VLA])in[0];
27588b783a1SJames Wright 
27688b783a1SJames Wright   // Outputs
27788b783a1SJames Wright   CeedScalar (*q0)[CEED_Q_VLA] = (CeedScalar(*)[CEED_Q_VLA])out[0];
27888b783a1SJames Wright 
279*88626eedSJames Wright   // Context
280*88626eedSJames Wright   const SetupContext context = (SetupContext)ctx;
281*88626eedSJames Wright   const CeedScalar theta0    = context->theta0;
282*88626eedSJames Wright   const CeedScalar P0        = context->P0;
283*88626eedSJames Wright   const CeedScalar cv        = context->cv;
284*88626eedSJames Wright   const CeedScalar cp        = context->cp;
285*88626eedSJames Wright   const CeedScalar *g        = context->g;
286*88626eedSJames Wright   const CeedScalar Rd        = cp - cv;
287*88626eedSJames Wright 
28888b783a1SJames Wright   // Quadrature Point Loop
28988b783a1SJames Wright   CeedPragmaSIMD
29088b783a1SJames Wright   for (CeedInt i=0; i<Q; i++) {
29188b783a1SJames Wright     CeedScalar q[5] = {0.};
29288b783a1SJames Wright 
29388b783a1SJames Wright     // Setup
29488b783a1SJames Wright     // -- Coordinates
295*88626eedSJames Wright     const CeedScalar x[3] = {X[0][i], X[1][i], X[2][i]};
296*88626eedSJames Wright     const CeedScalar e_potential = -(g[0]*x[0] + g[1]*x[1] + g[2]*x[2]);
29788b783a1SJames Wright 
29888b783a1SJames Wright     // -- Density
299*88626eedSJames Wright     const CeedScalar rho = P0 / (Rd*theta0);
30088b783a1SJames Wright 
30188b783a1SJames Wright     // Initial Conditions
30288b783a1SJames Wright     q[0] = rho;
30388b783a1SJames Wright     q[1] = 0.0;
30488b783a1SJames Wright     q[2] = 0.0;
30588b783a1SJames Wright     q[3] = 0.0;
306*88626eedSJames Wright     q[4] = rho * (cv*theta0 + e_potential);
30788b783a1SJames Wright 
30888b783a1SJames Wright     for (CeedInt j=0; j<5; j++)
30988b783a1SJames Wright       q0[j][i] = q[j];
31088b783a1SJames Wright   } // End of Quadrature Point Loop
31188b783a1SJames Wright   return 0;
31288b783a1SJames Wright }
31388b783a1SJames Wright 
31488b783a1SJames Wright // *****************************************************************************
31588b783a1SJames Wright // This QFunction implements the following formulation of Navier-Stokes with
31688b783a1SJames Wright //   explicit time stepping method
31788b783a1SJames Wright //
31888b783a1SJames Wright // This is 3D compressible Navier-Stokes in conservation form with state
31988b783a1SJames Wright //   variables of density, momentum density, and total energy density.
32088b783a1SJames Wright //
32188b783a1SJames Wright // State Variables: q = ( rho, U1, U2, U3, E )
32288b783a1SJames Wright //   rho - Mass Density
32388b783a1SJames Wright //   Ui  - Momentum Density,      Ui = rho ui
32488b783a1SJames Wright //   E   - Total Energy Density,  E  = rho (cv T + (u u)/2 + g z)
32588b783a1SJames Wright //
32688b783a1SJames Wright // Navier-Stokes Equations:
32788b783a1SJames Wright //   drho/dt + div( U )                               = 0
32888b783a1SJames Wright //   dU/dt   + div( rho (u x u) + P I3 ) + rho g khat = div( Fu )
32988b783a1SJames Wright //   dE/dt   + div( (E + P) u )                       = div( Fe )
33088b783a1SJames Wright //
33188b783a1SJames Wright // Viscous Stress:
33288b783a1SJames Wright //   Fu = mu (grad( u ) + grad( u )^T + lambda div ( u ) I3)
33388b783a1SJames Wright //
33488b783a1SJames Wright // Thermal Stress:
33588b783a1SJames Wright //   Fe = u Fu + k grad( T )
336*88626eedSJames Wright // Equation of State
33788b783a1SJames Wright //   P = (gamma - 1) (E - rho (u u) / 2 - rho g z)
33888b783a1SJames Wright //
33988b783a1SJames Wright // Stabilization:
34088b783a1SJames Wright //   Tau = diag(TauC, TauM, TauM, TauM, TauE)
34188b783a1SJames Wright //     f1 = rho  sqrt(ui uj gij)
34288b783a1SJames Wright //     gij = dXi/dX * dXi/dX
34388b783a1SJames Wright //     TauC = Cc f1 / (8 gii)
34488b783a1SJames Wright //     TauM = min( 1 , 1 / f1 )
34588b783a1SJames Wright //     TauE = TauM / (Ce cv)
34688b783a1SJames Wright //
34788b783a1SJames Wright //  SU   = Galerkin + grad(v) . ( Ai^T * Tau * (Aj q,j) )
34888b783a1SJames Wright //
34988b783a1SJames Wright // Constants:
35088b783a1SJames Wright //   lambda = - 2 / 3,  From Stokes hypothesis
35188b783a1SJames Wright //   mu              ,  Dynamic viscosity
35288b783a1SJames Wright //   k               ,  Thermal conductivity
35388b783a1SJames Wright //   cv              ,  Specific heat, constant volume
35488b783a1SJames Wright //   cp              ,  Specific heat, constant pressure
35588b783a1SJames Wright //   g               ,  Gravity
35688b783a1SJames Wright //   gamma  = cp / cv,  Specific heat ratio
35788b783a1SJames Wright //
35888b783a1SJames Wright // We require the product of the inverse of the Jacobian (dXdx_j,k) and
35988b783a1SJames Wright // its transpose (dXdx_k,j) to properly compute integrals of the form:
36088b783a1SJames Wright // int( gradv gradu )
36188b783a1SJames Wright //
36288b783a1SJames Wright // *****************************************************************************
36388b783a1SJames Wright CEED_QFUNCTION(Newtonian)(void *ctx, CeedInt Q,
36488b783a1SJames Wright                           const CeedScalar *const *in, CeedScalar *const *out) {
36588b783a1SJames Wright   // *INDENT-OFF*
36688b783a1SJames Wright   // Inputs
36788b783a1SJames Wright   const CeedScalar (*q)[CEED_Q_VLA] = (const CeedScalar(*)[CEED_Q_VLA])in[0],
36888b783a1SJames Wright                    (*dq)[5][CEED_Q_VLA] = (const CeedScalar(*)[5][CEED_Q_VLA])in[1],
36988b783a1SJames Wright                    (*q_data)[CEED_Q_VLA] = (const CeedScalar(*)[CEED_Q_VLA])in[2],
37088b783a1SJames Wright                    (*x)[CEED_Q_VLA] = (const CeedScalar(*)[CEED_Q_VLA])in[3];
37188b783a1SJames Wright   // Outputs
37288b783a1SJames Wright   CeedScalar (*v)[CEED_Q_VLA] = (CeedScalar(*)[CEED_Q_VLA])out[0],
37388b783a1SJames Wright              (*dv)[5][CEED_Q_VLA] = (CeedScalar(*)[5][CEED_Q_VLA])out[1];
37488b783a1SJames Wright   // *INDENT-ON*
37588b783a1SJames Wright 
37688b783a1SJames Wright   // Context
37788b783a1SJames Wright   NewtonianIdealGasContext context = (NewtonianIdealGasContext)ctx;
37888b783a1SJames Wright   const CeedScalar lambda = context->lambda;
37988b783a1SJames Wright   const CeedScalar mu     = context->mu;
38088b783a1SJames Wright   const CeedScalar k      = context->k;
38188b783a1SJames Wright   const CeedScalar cv     = context->cv;
38288b783a1SJames Wright   const CeedScalar cp     = context->cp;
383*88626eedSJames Wright   const CeedScalar *g     = context->g;
384*88626eedSJames Wright   const CeedScalar dt     = context->dt;
38588b783a1SJames Wright   const CeedScalar gamma  = cp / cv;
386*88626eedSJames Wright   const CeedScalar Rd     = cp - cv;
38788b783a1SJames Wright 
38888b783a1SJames Wright   CeedPragmaSIMD
38988b783a1SJames Wright   // Quadrature Point Loop
39088b783a1SJames Wright   for (CeedInt i=0; i<Q; i++) {
39188b783a1SJames Wright     // *INDENT-OFF*
39288b783a1SJames Wright     // Setup
39388b783a1SJames Wright     // -- Interp in
39488b783a1SJames Wright     const CeedScalar rho        =   q[0][i];
39588b783a1SJames Wright     const CeedScalar u[3]       =  {q[1][i] / rho,
39688b783a1SJames Wright                                     q[2][i] / rho,
39788b783a1SJames Wright                                     q[3][i] / rho
39888b783a1SJames Wright                                    };
39988b783a1SJames Wright     const CeedScalar E          =   q[4][i];
40088b783a1SJames Wright     // -- Grad in
40188b783a1SJames Wright     const CeedScalar drho[3]    =  {dq[0][0][i],
40288b783a1SJames Wright                                     dq[1][0][i],
40388b783a1SJames Wright                                     dq[2][0][i]
40488b783a1SJames Wright                                    };
40588b783a1SJames Wright     const CeedScalar dU[3][3]   = {{dq[0][1][i],
40688b783a1SJames Wright                                     dq[1][1][i],
40788b783a1SJames Wright                                     dq[2][1][i]},
40888b783a1SJames Wright                                    {dq[0][2][i],
40988b783a1SJames Wright                                     dq[1][2][i],
41088b783a1SJames Wright                                     dq[2][2][i]},
41188b783a1SJames Wright                                    {dq[0][3][i],
41288b783a1SJames Wright                                     dq[1][3][i],
41388b783a1SJames Wright                                     dq[2][3][i]}
41488b783a1SJames Wright                                   };
41588b783a1SJames Wright     const CeedScalar dE[3]      =  {dq[0][4][i],
41688b783a1SJames Wright                                     dq[1][4][i],
41788b783a1SJames Wright                                     dq[2][4][i]
41888b783a1SJames Wright                                    };
41988b783a1SJames Wright     // -- Interp-to-Interp q_data
42088b783a1SJames Wright     const CeedScalar wdetJ      =   q_data[0][i];
42188b783a1SJames Wright     // -- Interp-to-Grad q_data
42288b783a1SJames Wright     // ---- Inverse of change of coordinate matrix: X_i,j
42388b783a1SJames Wright     // *INDENT-OFF*
42488b783a1SJames Wright     const CeedScalar dXdx[3][3] = {{q_data[1][i],
42588b783a1SJames Wright                                     q_data[2][i],
42688b783a1SJames Wright                                     q_data[3][i]},
42788b783a1SJames Wright                                    {q_data[4][i],
42888b783a1SJames Wright                                     q_data[5][i],
42988b783a1SJames Wright                                     q_data[6][i]},
43088b783a1SJames Wright                                    {q_data[7][i],
43188b783a1SJames Wright                                     q_data[8][i],
43288b783a1SJames Wright                                     q_data[9][i]}
43388b783a1SJames Wright                                   };
434*88626eedSJames Wright     const CeedScalar x_i[3]       = {x[0][i], x[1][i], x[2][i]};
43588b783a1SJames Wright     // *INDENT-ON*
43688b783a1SJames Wright     // -- Grad-to-Grad q_data
43788b783a1SJames Wright     // dU/dx
43888b783a1SJames Wright     CeedScalar du[3][3] = {{0}};
43988b783a1SJames Wright     CeedScalar drhodx[3] = {0};
44088b783a1SJames Wright     CeedScalar dEdx[3] = {0};
44188b783a1SJames Wright     CeedScalar dUdx[3][3] = {{0}};
44288b783a1SJames Wright     CeedScalar dXdxdXdxT[3][3] = {{0}};
44388b783a1SJames Wright     for (int j=0; j<3; j++) {
44488b783a1SJames Wright       for (int k=0; k<3; k++) {
44588b783a1SJames Wright         du[j][k] = (dU[j][k] - drho[k]*u[j]) / rho;
44688b783a1SJames Wright         drhodx[j] += drho[k] * dXdx[k][j];
44788b783a1SJames Wright         dEdx[j] += dE[k] * dXdx[k][j];
44888b783a1SJames Wright         for (int l=0; l<3; l++) {
44988b783a1SJames Wright           dUdx[j][k] += dU[j][l] * dXdx[l][k];
45088b783a1SJames Wright           dXdxdXdxT[j][k] += dXdx[j][l]*dXdx[k][l];  //dXdx_j,k * dXdx_k,j
45188b783a1SJames Wright         }
45288b783a1SJames Wright       }
45388b783a1SJames Wright     }
45488b783a1SJames Wright     CeedScalar dudx[3][3] = {{0}};
45588b783a1SJames Wright     for (int j=0; j<3; j++)
45688b783a1SJames Wright       for (int k=0; k<3; k++)
45788b783a1SJames Wright         for (int l=0; l<3; l++)
45888b783a1SJames Wright           dudx[j][k] += du[j][l] * dXdx[l][k];
45988b783a1SJames Wright     // -- grad_T
46088b783a1SJames Wright     const CeedScalar grad_T[3]  = {(dEdx[0]/rho - E*drhodx[0]/(rho*rho) - /* *NOPAD* */
461*88626eedSJames Wright                                     (u[0]*dudx[0][0] + u[1]*dudx[1][0] + u[2]*dudx[2][0]) + g[0])/cv,
46288b783a1SJames Wright                                    (dEdx[1]/rho - E*drhodx[1]/(rho*rho) - /* *NOPAD* */
463*88626eedSJames Wright                                     (u[0]*dudx[0][1] + u[1]*dudx[1][1] + u[2]*dudx[2][1]) + g[1])/cv,
46488b783a1SJames Wright                                    (dEdx[2]/rho - E*drhodx[2]/(rho*rho) - /* *NOPAD* */
465*88626eedSJames Wright                                     (u[0]*dudx[0][2] + u[1]*dudx[1][2] + u[2]*dudx[2][2]) + g[2])/cv
46688b783a1SJames Wright                                   };
46788b783a1SJames Wright 
46888b783a1SJames Wright     // -- Fuvisc
46988b783a1SJames Wright     // ---- Symmetric 3x3 matrix
47088b783a1SJames Wright     const CeedScalar Fu[6]     =  {mu*(dudx[0][0] * (2 + lambda) + /* *NOPAD* */
47188b783a1SJames Wright                                        lambda * (dudx[1][1] + dudx[2][2])),
47288b783a1SJames Wright                                    mu*(dudx[0][1] + dudx[1][0]), /* *NOPAD* */
47388b783a1SJames Wright                                    mu*(dudx[0][2] + dudx[2][0]), /* *NOPAD* */
47488b783a1SJames Wright                                    mu*(dudx[1][1] * (2 + lambda) + /* *NOPAD* */
47588b783a1SJames Wright                                        lambda * (dudx[0][0] + dudx[2][2])),
47688b783a1SJames Wright                                    mu*(dudx[1][2] + dudx[2][1]), /* *NOPAD* */
47788b783a1SJames Wright                                    mu*(dudx[2][2] * (2 + lambda) + /* *NOPAD* */
47888b783a1SJames Wright                                        lambda * (dudx[0][0] + dudx[1][1]))
47988b783a1SJames Wright                                   };
48088b783a1SJames Wright     // -- Fevisc
48188b783a1SJames Wright     const CeedScalar Fe[3]     =  {u[0]*Fu[0] + u[1]*Fu[1] + u[2]*Fu[2] + /* *NOPAD* */
48288b783a1SJames Wright                                    k*grad_T[0], /* *NOPAD* */
48388b783a1SJames Wright                                    u[0]*Fu[1] + u[1]*Fu[3] + u[2]*Fu[4] + /* *NOPAD* */
48488b783a1SJames Wright                                    k*grad_T[1], /* *NOPAD* */
48588b783a1SJames Wright                                    u[0]*Fu[2] + u[1]*Fu[4] + u[2]*Fu[5] + /* *NOPAD* */
48688b783a1SJames Wright                                    k*grad_T[2] /* *NOPAD* */
48788b783a1SJames Wright                                   };
48888b783a1SJames Wright     // Pressure
48988b783a1SJames Wright     const CeedScalar
49088b783a1SJames Wright     E_kinetic   = 0.5 * rho * (u[0]*u[0] + u[1]*u[1] + u[2]*u[2]),
491*88626eedSJames Wright     E_potential = -rho*(g[0]*x_i[0] + g[1]*x_i[1] + g[2]*x_i[2]),
49288b783a1SJames Wright     E_internal  = E - E_kinetic - E_potential,
49388b783a1SJames Wright     P           = E_internal * (gamma - 1.); // P = pressure
49488b783a1SJames Wright 
49588b783a1SJames Wright     // jacob_F_conv[3][5][5] = dF(convective)/dq at each direction
49688b783a1SJames Wright     CeedScalar jacob_F_conv[3][5][5] = {{{0.}}};
497*88626eedSJames Wright     computeFluxJacobian_NS(jacob_F_conv, rho, u, E, gamma, g, x_i);
49888b783a1SJames Wright 
49988b783a1SJames Wright     // dqdx collects drhodx, dUdx and dEdx in one vector
50088b783a1SJames Wright     CeedScalar dqdx[5][3];
50188b783a1SJames Wright     for (int j=0; j<3; j++) {
50288b783a1SJames Wright       dqdx[0][j] = drhodx[j];
50388b783a1SJames Wright       dqdx[4][j] = dEdx[j];
50488b783a1SJames Wright       for (int k=0; k<3; k++)
50588b783a1SJames Wright         dqdx[k+1][j] = dUdx[k][j];
50688b783a1SJames Wright     }
50788b783a1SJames Wright 
50888b783a1SJames Wright     // strong_conv = dF/dq * dq/dx    (Strong convection)
50988b783a1SJames Wright     CeedScalar strong_conv[5] = {0};
51088b783a1SJames Wright     for (int j=0; j<3; j++)
51188b783a1SJames Wright       for (int k=0; k<5; k++)
51288b783a1SJames Wright         for (int l=0; l<5; l++)
51388b783a1SJames Wright           strong_conv[k] += jacob_F_conv[j][k][l] * dqdx[l][j];
51488b783a1SJames Wright 
51588b783a1SJames Wright     // Body force
516*88626eedSJames Wright     const CeedScalar body_force[5] = {0, rho *g[0], rho *g[1], rho *g[2], 0};
51788b783a1SJames Wright 
51888b783a1SJames Wright     // The Physics
51988b783a1SJames Wright     // Zero dv so all future terms can safely sum into it
52088b783a1SJames Wright     for (int j=0; j<5; j++)
52188b783a1SJames Wright       for (int k=0; k<3; k++)
52288b783a1SJames Wright         dv[k][j][i] = 0;
52388b783a1SJames Wright 
52488b783a1SJames Wright     // -- Density
52588b783a1SJames Wright     // ---- u rho
52688b783a1SJames Wright     for (int j=0; j<3; j++)
52788b783a1SJames Wright       dv[j][0][i]  += wdetJ*(rho*u[0]*dXdx[j][0] + rho*u[1]*dXdx[j][1] +
52888b783a1SJames Wright                              rho*u[2]*dXdx[j][2]);
52988b783a1SJames Wright     // -- Momentum
53088b783a1SJames Wright     // ---- rho (u x u) + P I3
53188b783a1SJames Wright     for (int j=0; j<3; j++)
53288b783a1SJames Wright       for (int k=0; k<3; k++)
53388b783a1SJames Wright         dv[k][j+1][i]  += wdetJ*((rho*u[j]*u[0] + (j==0?P:0))*dXdx[k][0] +
53488b783a1SJames Wright                                  (rho*u[j]*u[1] + (j==1?P:0))*dXdx[k][1] +
53588b783a1SJames Wright                                  (rho*u[j]*u[2] + (j==2?P:0))*dXdx[k][2]);
53688b783a1SJames Wright     // ---- Fuvisc
53788b783a1SJames Wright     const CeedInt Fuviscidx[3][3] = {{0, 1, 2}, {1, 3, 4}, {2, 4, 5}}; // symmetric matrix indices
53888b783a1SJames Wright     for (int j=0; j<3; j++)
53988b783a1SJames Wright       for (int k=0; k<3; k++)
54088b783a1SJames Wright         dv[k][j+1][i] -= wdetJ*(Fu[Fuviscidx[j][0]]*dXdx[k][0] +
54188b783a1SJames Wright                                 Fu[Fuviscidx[j][1]]*dXdx[k][1] +
54288b783a1SJames Wright                                 Fu[Fuviscidx[j][2]]*dXdx[k][2]);
54388b783a1SJames Wright     // -- Total Energy Density
54488b783a1SJames Wright     // ---- (E + P) u
54588b783a1SJames Wright     for (int j=0; j<3; j++)
54688b783a1SJames Wright       dv[j][4][i]  += wdetJ * (E + P) * (u[0]*dXdx[j][0] + u[1]*dXdx[j][1] +
54788b783a1SJames Wright                                          u[2]*dXdx[j][2]);
54888b783a1SJames Wright     // ---- Fevisc
54988b783a1SJames Wright     for (int j=0; j<3; j++)
55088b783a1SJames Wright       dv[j][4][i] -= wdetJ * (Fe[0]*dXdx[j][0] + Fe[1]*dXdx[j][1] +
55188b783a1SJames Wright                               Fe[2]*dXdx[j][2]);
55288b783a1SJames Wright     // Body Force
55388b783a1SJames Wright     for (int j=0; j<5; j++)
55488b783a1SJames Wright       v[j][i] = wdetJ * body_force[j];
55588b783a1SJames Wright 
556*88626eedSJames Wright     // Spatial Stabilization
557*88626eedSJames Wright     // -- Not used in favor of diagonal tau. Kept for future testing
558*88626eedSJames Wright     // const CeedScalar sound_speed = sqrt(gamma * P / rho);
559*88626eedSJames Wright     // CeedScalar Tau_x[3] = {0.};
560*88626eedSJames Wright     // Tau_spatial(Tau_x, dXdx, u, sound_speed, context->c_tau, mu);
56188b783a1SJames Wright 
562*88626eedSJames Wright     // -- Stabilization method: none, SU, or SUPG
563*88626eedSJames Wright     CeedScalar stab[5][3] = {{0.}};
564*88626eedSJames Wright     CeedScalar tau_strong_conv[5] = {0.}, tau_strong_conv_conservative[5] = {0};
565*88626eedSJames Wright     CeedScalar Tau_d[3] = {0.};
56688b783a1SJames Wright     switch (context->stabilization) {
56788b783a1SJames Wright     case STAB_NONE:        // Galerkin
56888b783a1SJames Wright       break;
56988b783a1SJames Wright     case STAB_SU:        // SU
570*88626eedSJames Wright       Tau_diagPrim(Tau_d, dXdx, u, cv, context, mu, dt, rho);
571*88626eedSJames Wright       tau_strong_conv[0] = Tau_d[0] * strong_conv[0];
572*88626eedSJames Wright       tau_strong_conv[1] = Tau_d[1] * strong_conv[1];
573*88626eedSJames Wright       tau_strong_conv[2] = Tau_d[1] * strong_conv[2];
574*88626eedSJames Wright       tau_strong_conv[3] = Tau_d[1] * strong_conv[3];
575*88626eedSJames Wright       tau_strong_conv[4] = Tau_d[2] * strong_conv[4];
576*88626eedSJames Wright       PrimitiveToConservative_fwd(rho, u, E, Rd, cv, tau_strong_conv,
577*88626eedSJames Wright                                   tau_strong_conv_conservative);
57888b783a1SJames Wright       for (int j=0; j<3; j++)
57988b783a1SJames Wright         for (int k=0; k<5; k++)
58088b783a1SJames Wright           for (int l=0; l<5; l++)
581*88626eedSJames Wright             stab[k][j] += jacob_F_conv[j][k][l] * tau_strong_conv_conservative[l];
58288b783a1SJames Wright 
58388b783a1SJames Wright       for (int j=0; j<5; j++)
58488b783a1SJames Wright         for (int k=0; k<3; k++)
58588b783a1SJames Wright           dv[k][j][i] -= wdetJ*(stab[j][0] * dXdx[k][0] +
58688b783a1SJames Wright                                 stab[j][1] * dXdx[k][1] +
58788b783a1SJames Wright                                 stab[j][2] * dXdx[k][2]);
58888b783a1SJames Wright       break;
58988b783a1SJames Wright     case STAB_SUPG:        // SUPG is not implemented for explicit scheme
59088b783a1SJames Wright       break;
59188b783a1SJames Wright     }
59288b783a1SJames Wright 
59388b783a1SJames Wright   } // End Quadrature Point Loop
59488b783a1SJames Wright 
59588b783a1SJames Wright   // Return
59688b783a1SJames Wright   return 0;
59788b783a1SJames Wright }
59888b783a1SJames Wright 
59988b783a1SJames Wright // *****************************************************************************
60088b783a1SJames Wright // This QFunction implements the Navier-Stokes equations (mentioned above) with
60188b783a1SJames Wright //   implicit time stepping method
60288b783a1SJames Wright //
60388b783a1SJames Wright //  SU   = Galerkin + grad(v) . ( Ai^T * Tau * (Aj q,j) )
60488b783a1SJames Wright //  SUPG = Galerkin + grad(v) . ( Ai^T * Tau * (q_dot + Aj q,j - body force) )
60588b783a1SJames Wright //                                       (diffussive terms will be added later)
60688b783a1SJames Wright //
60788b783a1SJames Wright // *****************************************************************************
60888b783a1SJames Wright CEED_QFUNCTION(IFunction_Newtonian)(void *ctx, CeedInt Q,
60988b783a1SJames Wright                                     const CeedScalar *const *in,
61088b783a1SJames Wright                                     CeedScalar *const *out) {
61188b783a1SJames Wright   // *INDENT-OFF*
61288b783a1SJames Wright   // Inputs
61388b783a1SJames Wright   const CeedScalar (*q)[CEED_Q_VLA] = (const CeedScalar(*)[CEED_Q_VLA])in[0],
61488b783a1SJames Wright                    (*dq)[5][CEED_Q_VLA] = (const CeedScalar(*)[5][CEED_Q_VLA])in[1],
61588b783a1SJames Wright                    (*q_dot)[CEED_Q_VLA] = (const CeedScalar(*)[CEED_Q_VLA])in[2],
61688b783a1SJames Wright                    (*q_data)[CEED_Q_VLA] = (const CeedScalar(*)[CEED_Q_VLA])in[3],
61788b783a1SJames Wright                    (*x)[CEED_Q_VLA] = (const CeedScalar(*)[CEED_Q_VLA])in[4];
61888b783a1SJames Wright   // Outputs
61988b783a1SJames Wright   CeedScalar (*v)[CEED_Q_VLA] = (CeedScalar(*)[CEED_Q_VLA])out[0],
62088b783a1SJames Wright              (*dv)[5][CEED_Q_VLA] = (CeedScalar(*)[5][CEED_Q_VLA])out[1];
62188b783a1SJames Wright   // *INDENT-ON*
62288b783a1SJames Wright   // Context
62388b783a1SJames Wright   NewtonianIdealGasContext context = (NewtonianIdealGasContext)ctx;
62488b783a1SJames Wright   const CeedScalar lambda = context->lambda;
62588b783a1SJames Wright   const CeedScalar mu     = context->mu;
62688b783a1SJames Wright   const CeedScalar k      = context->k;
62788b783a1SJames Wright   const CeedScalar cv     = context->cv;
62888b783a1SJames Wright   const CeedScalar cp     = context->cp;
629*88626eedSJames Wright   const CeedScalar *g     = context->g;
630*88626eedSJames Wright   const CeedScalar dt     = context->dt;
63188b783a1SJames Wright   const CeedScalar gamma  = cp / cv;
632*88626eedSJames Wright   const CeedScalar Rd     = cp-cv;
63388b783a1SJames Wright 
63488b783a1SJames Wright   CeedPragmaSIMD
63588b783a1SJames Wright   // Quadrature Point Loop
63688b783a1SJames Wright   for (CeedInt i=0; i<Q; i++) {
63788b783a1SJames Wright     // Setup
63888b783a1SJames Wright     // -- Interp in
63988b783a1SJames Wright     const CeedScalar rho        =   q[0][i];
64088b783a1SJames Wright     const CeedScalar u[3]       =  {q[1][i] / rho,
64188b783a1SJames Wright                                     q[2][i] / rho,
64288b783a1SJames Wright                                     q[3][i] / rho
64388b783a1SJames Wright                                    };
64488b783a1SJames Wright     const CeedScalar E          =   q[4][i];
64588b783a1SJames Wright     // -- Grad in
64688b783a1SJames Wright     const CeedScalar drho[3]    =  {dq[0][0][i],
64788b783a1SJames Wright                                     dq[1][0][i],
64888b783a1SJames Wright                                     dq[2][0][i]
64988b783a1SJames Wright                                    };
65088b783a1SJames Wright     // *INDENT-OFF*
65188b783a1SJames Wright     const CeedScalar dU[3][3]   = {{dq[0][1][i],
65288b783a1SJames Wright                                     dq[1][1][i],
65388b783a1SJames Wright                                     dq[2][1][i]},
65488b783a1SJames Wright                                    {dq[0][2][i],
65588b783a1SJames Wright                                     dq[1][2][i],
65688b783a1SJames Wright                                     dq[2][2][i]},
65788b783a1SJames Wright                                    {dq[0][3][i],
65888b783a1SJames Wright                                     dq[1][3][i],
65988b783a1SJames Wright                                     dq[2][3][i]}
66088b783a1SJames Wright                                   };
66188b783a1SJames Wright     // *INDENT-ON*
66288b783a1SJames Wright     const CeedScalar dE[3]      =  {dq[0][4][i],
66388b783a1SJames Wright                                     dq[1][4][i],
66488b783a1SJames Wright                                     dq[2][4][i]
66588b783a1SJames Wright                                    };
66688b783a1SJames Wright     // -- Interp-to-Interp q_data
66788b783a1SJames Wright     const CeedScalar wdetJ      =   q_data[0][i];
66888b783a1SJames Wright     // -- Interp-to-Grad q_data
66988b783a1SJames Wright     // ---- Inverse of change of coordinate matrix: X_i,j
67088b783a1SJames Wright     // *INDENT-OFF*
67188b783a1SJames Wright     const CeedScalar dXdx[3][3] = {{q_data[1][i],
67288b783a1SJames Wright                                     q_data[2][i],
67388b783a1SJames Wright                                     q_data[3][i]},
67488b783a1SJames Wright                                    {q_data[4][i],
67588b783a1SJames Wright                                     q_data[5][i],
67688b783a1SJames Wright                                     q_data[6][i]},
67788b783a1SJames Wright                                    {q_data[7][i],
67888b783a1SJames Wright                                     q_data[8][i],
67988b783a1SJames Wright                                     q_data[9][i]}
68088b783a1SJames Wright                                   };
681*88626eedSJames Wright     const CeedScalar x_i[3]     = {x[0][i], x[1][i], x[2][i]};
68288b783a1SJames Wright     // *INDENT-ON*
68388b783a1SJames Wright     // -- Grad-to-Grad q_data
68488b783a1SJames Wright     // dU/dx
68588b783a1SJames Wright     CeedScalar du[3][3] = {{0}};
68688b783a1SJames Wright     CeedScalar drhodx[3] = {0};
68788b783a1SJames Wright     CeedScalar dEdx[3] = {0};
68888b783a1SJames Wright     CeedScalar dUdx[3][3] = {{0}};
68988b783a1SJames Wright     CeedScalar dXdxdXdxT[3][3] = {{0}};
69088b783a1SJames Wright     for (int j=0; j<3; j++) {
69188b783a1SJames Wright       for (int k=0; k<3; k++) {
69288b783a1SJames Wright         du[j][k] = (dU[j][k] - drho[k]*u[j]) / rho;
69388b783a1SJames Wright         drhodx[j] += drho[k] * dXdx[k][j];
69488b783a1SJames Wright         dEdx[j] += dE[k] * dXdx[k][j];
69588b783a1SJames Wright         for (int l=0; l<3; l++) {
69688b783a1SJames Wright           dUdx[j][k] += dU[j][l] * dXdx[l][k];
69788b783a1SJames Wright           dXdxdXdxT[j][k] += dXdx[j][l]*dXdx[k][l];  //dXdx_j,k * dXdx_k,j
69888b783a1SJames Wright         }
69988b783a1SJames Wright       }
70088b783a1SJames Wright     }
70188b783a1SJames Wright     CeedScalar dudx[3][3] = {{0}};
70288b783a1SJames Wright     for (int j=0; j<3; j++)
70388b783a1SJames Wright       for (int k=0; k<3; k++)
70488b783a1SJames Wright         for (int l=0; l<3; l++)
70588b783a1SJames Wright           dudx[j][k] += du[j][l] * dXdx[l][k];
70688b783a1SJames Wright     // -- grad_T
70788b783a1SJames Wright     const CeedScalar grad_T[3]  = {(dEdx[0]/rho - E*drhodx[0]/(rho*rho) - /* *NOPAD* */
708*88626eedSJames Wright                                     (u[0]*dudx[0][0] + u[1]*dudx[1][0] + u[2]*dudx[2][0]) + g[0])/cv,
70988b783a1SJames Wright                                    (dEdx[1]/rho - E*drhodx[1]/(rho*rho) - /* *NOPAD* */
710*88626eedSJames Wright                                     (u[0]*dudx[0][1] + u[1]*dudx[1][1] + u[2]*dudx[2][1]) + g[1])/cv,
71188b783a1SJames Wright                                    (dEdx[2]/rho - E*drhodx[2]/(rho*rho) - /* *NOPAD* */
712*88626eedSJames Wright                                     (u[0]*dudx[0][2] + u[1]*dudx[1][2] + u[2]*dudx[2][2]) + g[2])/cv
71388b783a1SJames Wright                                   };
71488b783a1SJames Wright     // -- Fuvisc
71588b783a1SJames Wright     // ---- Symmetric 3x3 matrix
71688b783a1SJames Wright     const CeedScalar Fu[6]     =  {mu*(dudx[0][0] * (2 + lambda) + /* *NOPAD* */
71788b783a1SJames Wright                                        lambda * (dudx[1][1] + dudx[2][2])),
71888b783a1SJames Wright                                    mu*(dudx[0][1] + dudx[1][0]), /* *NOPAD* */
71988b783a1SJames Wright                                    mu*(dudx[0][2] + dudx[2][0]), /* *NOPAD* */
72088b783a1SJames Wright                                    mu*(dudx[1][1] * (2 + lambda) + /* *NOPAD* */
72188b783a1SJames Wright                                        lambda * (dudx[0][0] + dudx[2][2])),
72288b783a1SJames Wright                                    mu*(dudx[1][2] + dudx[2][1]), /* *NOPAD* */
72388b783a1SJames Wright                                    mu*(dudx[2][2] * (2 + lambda) + /* *NOPAD* */
72488b783a1SJames Wright                                        lambda * (dudx[0][0] + dudx[1][1]))
72588b783a1SJames Wright                                   };
72688b783a1SJames Wright     // -- Fevisc
72788b783a1SJames Wright     const CeedScalar Fe[3]     =  {u[0]*Fu[0] + u[1]*Fu[1] + u[2]*Fu[2] + /* *NOPAD* */
72888b783a1SJames Wright                                    k*grad_T[0], /* *NOPAD* */
72988b783a1SJames Wright                                    u[0]*Fu[1] + u[1]*Fu[3] + u[2]*Fu[4] + /* *NOPAD* */
73088b783a1SJames Wright                                    k*grad_T[1], /* *NOPAD* */
73188b783a1SJames Wright                                    u[0]*Fu[2] + u[1]*Fu[4] + u[2]*Fu[5] + /* *NOPAD* */
73288b783a1SJames Wright                                    k*grad_T[2] /* *NOPAD* */
73388b783a1SJames Wright                                   };
73488b783a1SJames Wright     // Pressure
73588b783a1SJames Wright     const CeedScalar
73688b783a1SJames Wright     E_kinetic   = 0.5 * rho * (u[0]*u[0] + u[1]*u[1] + u[2]*u[2]),
737*88626eedSJames Wright     E_potential = -rho*(g[0]*x_i[0] + g[1]*x_i[1] + g[2]*x_i[2]),
73888b783a1SJames Wright     E_internal  = E - E_kinetic - E_potential,
73988b783a1SJames Wright     P           = E_internal * (gamma - 1.); // P = pressure
74088b783a1SJames Wright 
74188b783a1SJames Wright     // jacob_F_conv[3][5][5] = dF(convective)/dq at each direction
74288b783a1SJames Wright     CeedScalar jacob_F_conv[3][5][5] = {{{0.}}};
743*88626eedSJames Wright     computeFluxJacobian_NS(jacob_F_conv, rho, u, E, gamma, g, x_i);
74488b783a1SJames Wright 
74588b783a1SJames Wright     // dqdx collects drhodx, dUdx and dEdx in one vector
74688b783a1SJames Wright     CeedScalar dqdx[5][3];
74788b783a1SJames Wright     for (int j=0; j<3; j++) {
74888b783a1SJames Wright       dqdx[0][j] = drhodx[j];
74988b783a1SJames Wright       dqdx[4][j] = dEdx[j];
75088b783a1SJames Wright       for (int k=0; k<3; k++)
75188b783a1SJames Wright         dqdx[k+1][j] = dUdx[k][j];
75288b783a1SJames Wright     }
75388b783a1SJames Wright     // strong_conv = dF/dq * dq/dx    (Strong convection)
75488b783a1SJames Wright     CeedScalar strong_conv[5] = {0};
75588b783a1SJames Wright     for (int j=0; j<3; j++)
75688b783a1SJames Wright       for (int k=0; k<5; k++)
75788b783a1SJames Wright         for (int l=0; l<5; l++)
75888b783a1SJames Wright           strong_conv[k] += jacob_F_conv[j][k][l] * dqdx[l][j];
75988b783a1SJames Wright 
76088b783a1SJames Wright     // Body force
761*88626eedSJames Wright     const CeedScalar body_force[5] = {0, rho *g[0], rho *g[1], rho *g[2], 0};
76288b783a1SJames Wright 
76388b783a1SJames Wright     // Strong residual
76488b783a1SJames Wright     CeedScalar strong_res[5];
76588b783a1SJames Wright     for (int j=0; j<5; j++)
76688b783a1SJames Wright       strong_res[j] = q_dot[j][i] + strong_conv[j] - body_force[j];
76788b783a1SJames Wright 
76888b783a1SJames Wright     // The Physics
76988b783a1SJames Wright     //-----mass matrix
77088b783a1SJames Wright     for (int j=0; j<5; j++)
77188b783a1SJames Wright       v[j][i] = wdetJ*q_dot[j][i];
77288b783a1SJames Wright 
77388b783a1SJames Wright     // Zero dv so all future terms can safely sum into it
77488b783a1SJames Wright     for (int j=0; j<5; j++)
77588b783a1SJames Wright       for (int k=0; k<3; k++)
77688b783a1SJames Wright         dv[k][j][i] = 0;
77788b783a1SJames Wright 
77888b783a1SJames Wright     // -- Density
77988b783a1SJames Wright     // ---- u rho
78088b783a1SJames Wright     for (int j=0; j<3; j++)
78188b783a1SJames Wright       dv[j][0][i]  -= wdetJ*(rho*u[0]*dXdx[j][0] + rho*u[1]*dXdx[j][1] +
78288b783a1SJames Wright                              rho*u[2]*dXdx[j][2]);
78388b783a1SJames Wright     // -- Momentum
78488b783a1SJames Wright     // ---- rho (u x u) + P I3
78588b783a1SJames Wright     for (int j=0; j<3; j++)
78688b783a1SJames Wright       for (int k=0; k<3; k++)
78788b783a1SJames Wright         dv[k][j+1][i]  -= wdetJ*((rho*u[j]*u[0] + (j==0?P:0))*dXdx[k][0] +
78888b783a1SJames Wright                                  (rho*u[j]*u[1] + (j==1?P:0))*dXdx[k][1] +
78988b783a1SJames Wright                                  (rho*u[j]*u[2] + (j==2?P:0))*dXdx[k][2]);
79088b783a1SJames Wright     // ---- Fuvisc
79188b783a1SJames Wright     const CeedInt Fuviscidx[3][3] = {{0, 1, 2}, {1, 3, 4}, {2, 4, 5}}; // symmetric matrix indices
79288b783a1SJames Wright     for (int j=0; j<3; j++)
79388b783a1SJames Wright       for (int k=0; k<3; k++)
79488b783a1SJames Wright         dv[k][j+1][i] += wdetJ*(Fu[Fuviscidx[j][0]]*dXdx[k][0] +
79588b783a1SJames Wright                                 Fu[Fuviscidx[j][1]]*dXdx[k][1] +
79688b783a1SJames Wright                                 Fu[Fuviscidx[j][2]]*dXdx[k][2]);
79788b783a1SJames Wright     // -- Total Energy Density
79888b783a1SJames Wright     // ---- (E + P) u
79988b783a1SJames Wright     for (int j=0; j<3; j++)
80088b783a1SJames Wright       dv[j][4][i]  -= wdetJ * (E + P) * (u[0]*dXdx[j][0] + u[1]*dXdx[j][1] +
80188b783a1SJames Wright                                          u[2]*dXdx[j][2]);
80288b783a1SJames Wright     // ---- Fevisc
80388b783a1SJames Wright     for (int j=0; j<3; j++)
80488b783a1SJames Wright       dv[j][4][i] += wdetJ * (Fe[0]*dXdx[j][0] + Fe[1]*dXdx[j][1] +
80588b783a1SJames Wright                               Fe[2]*dXdx[j][2]);
80688b783a1SJames Wright     // Body Force
80788b783a1SJames Wright     for (int j=0; j<5; j++)
80888b783a1SJames Wright       v[j][i] -= wdetJ*body_force[j];
80988b783a1SJames Wright 
810*88626eedSJames Wright     // Spatial Stabilization
811*88626eedSJames Wright     // -- Not used in favor of diagonal tau. Kept for future testing
812*88626eedSJames Wright     // const CeedScalar sound_speed = sqrt(gamma * P / rho);
813*88626eedSJames Wright     // CeedScalar Tau_x[3] = {0.};
814*88626eedSJames Wright     // Tau_spatial(Tau_x, dXdx, u, sound_speed, c_tau, mu);
81588b783a1SJames Wright 
81688b783a1SJames Wright     // -- Stabilization method: none, SU, or SUPG
817*88626eedSJames Wright     CeedScalar stab[5][3] = {{0.}};
818*88626eedSJames Wright     CeedScalar tau_strong_res[5] = {0.}, tau_strong_res_conservative[5] = {0};
819*88626eedSJames Wright     CeedScalar tau_strong_conv[5] = {0.}, tau_strong_conv_conservative[5] = {0};
820*88626eedSJames Wright     CeedScalar Tau_d[3] = {0.};
82188b783a1SJames Wright     switch (context->stabilization) {
82288b783a1SJames Wright     case STAB_NONE:        // Galerkin
82388b783a1SJames Wright       break;
82488b783a1SJames Wright     case STAB_SU:        // SU
825*88626eedSJames Wright       Tau_diagPrim(Tau_d, dXdx, u, cv, context, mu, dt, rho);
826*88626eedSJames Wright       tau_strong_conv[0] = Tau_d[0] * strong_conv[0];
827*88626eedSJames Wright       tau_strong_conv[1] = Tau_d[1] * strong_conv[1];
828*88626eedSJames Wright       tau_strong_conv[2] = Tau_d[1] * strong_conv[2];
829*88626eedSJames Wright       tau_strong_conv[3] = Tau_d[1] * strong_conv[3];
830*88626eedSJames Wright       tau_strong_conv[4] = Tau_d[2] * strong_conv[4];
831*88626eedSJames Wright       PrimitiveToConservative_fwd(rho, u, E, Rd, cv, tau_strong_conv,
832*88626eedSJames Wright                                   tau_strong_conv_conservative);
83388b783a1SJames Wright       for (int j=0; j<3; j++)
83488b783a1SJames Wright         for (int k=0; k<5; k++)
83588b783a1SJames Wright           for (int l=0; l<5; l++)
836*88626eedSJames Wright             stab[k][j] += jacob_F_conv[j][k][l] * tau_strong_conv_conservative[l];
83788b783a1SJames Wright 
83888b783a1SJames Wright       for (int j=0; j<5; j++)
83988b783a1SJames Wright         for (int k=0; k<3; k++)
84088b783a1SJames Wright           dv[k][j][i] += wdetJ*(stab[j][0] * dXdx[k][0] +
84188b783a1SJames Wright                                 stab[j][1] * dXdx[k][1] +
84288b783a1SJames Wright                                 stab[j][2] * dXdx[k][2]);
84388b783a1SJames Wright       break;
84488b783a1SJames Wright     case STAB_SUPG:        // SUPG
845*88626eedSJames Wright       Tau_diagPrim(Tau_d, dXdx, u, cv, context, mu, dt, rho);
846*88626eedSJames Wright       tau_strong_res[0] = Tau_d[0] * strong_res[0];
847*88626eedSJames Wright       tau_strong_res[1] = Tau_d[1] * strong_res[1];
848*88626eedSJames Wright       tau_strong_res[2] = Tau_d[1] * strong_res[2];
849*88626eedSJames Wright       tau_strong_res[3] = Tau_d[1] * strong_res[3];
850*88626eedSJames Wright       tau_strong_res[4] = Tau_d[2] * strong_res[4];
851*88626eedSJames Wright // Alternate route (useful later with primitive variable code)
852*88626eedSJames Wright // this function was verified against PHASTA for as IC that was as close as possible
853*88626eedSJames Wright //    computeFluxJacobian_NSp(jacob_F_conv_p, rho, u, E, Rd, cv);
854*88626eedSJames Wright // it has also been verified to compute a correct through the following
855*88626eedSJames Wright //   stab[k][j] += jacob_F_conv_p[j][k][l] * tau_strong_res[l] // flux Jacobian wrt primitive
856*88626eedSJames Wright // applied in the triple loop below
857*88626eedSJames Wright //  However, it is more flops than using the existing Jacobian wrt q after q_{,Y} viz
858*88626eedSJames Wright       PrimitiveToConservative_fwd(rho, u, E, Rd, cv, tau_strong_res,
859*88626eedSJames Wright                                   tau_strong_res_conservative);
86088b783a1SJames Wright       for (int j=0; j<3; j++)
86188b783a1SJames Wright         for (int k=0; k<5; k++)
86288b783a1SJames Wright           for (int l=0; l<5; l++)
863*88626eedSJames Wright             stab[k][j] += jacob_F_conv[j][k][l] * tau_strong_res_conservative[l];
86488b783a1SJames Wright 
86588b783a1SJames Wright       for (int j=0; j<5; j++)
86688b783a1SJames Wright         for (int k=0; k<3; k++)
86788b783a1SJames Wright           dv[k][j][i] += wdetJ*(stab[j][0] * dXdx[k][0] +
86888b783a1SJames Wright                                 stab[j][1] * dXdx[k][1] +
86988b783a1SJames Wright                                 stab[j][2] * dXdx[k][2]);
87088b783a1SJames Wright       break;
87188b783a1SJames Wright     }
87288b783a1SJames Wright 
87388b783a1SJames Wright   } // End Quadrature Point Loop
87488b783a1SJames Wright 
87588b783a1SJames Wright   // Return
87688b783a1SJames Wright   return 0;
87788b783a1SJames Wright }
87888b783a1SJames Wright // *****************************************************************************
87988b783a1SJames Wright #endif // newtonian_h
880