honee/qfunctions/newtonian.h

727da7e7SJeremy L Thompson// Copyright (c) 2017-2022, Lawrence Livermore National Security, LLC and other CEED contributors.
727da7e7SJeremy L Thompson// All Rights Reserved. See the top-level LICENSE and NOTICE files for details.
3a8779fbSJames Wright//
727da7e7SJeremy L Thompson// SPDX-License-Identifier: BSD-2-Clause
3a8779fbSJames Wright//
727da7e7SJeremy L Thompson// This file is part of CEED:  http://github.com/ceed
3a8779fbSJames Wright
3a8779fbSJames Wright/// @file
3a8779fbSJames Wright/// Operator for Navier-Stokes example using PETSc
3a8779fbSJames Wright
3a8779fbSJames Wright
3a8779fbSJames Wright#ifndef newtonian_h
3a8779fbSJames Wright#define newtonian_h
3a8779fbSJames Wright
3a8779fbSJames Wright#include <math.h>
3a8779fbSJames Wright#include <ceed.h>
15a3537eSJed Brown#include "newtonian_types.h"
475b2820SJames Wright#include "newtonian_state.h"
3a8779fbSJames Wright
3a8779fbSJames Wright#ifndef M_PI
3a8779fbSJames Wright#define M_PI    3.14159265358979323846
3a8779fbSJames Wright#endif
3a8779fbSJames Wright
3a8779fbSJames Wright// *****************************************************************************
3a8779fbSJames Wright// Helper function for computing flux Jacobian
3a8779fbSJames Wright// *****************************************************************************
3a8779fbSJames WrightCEED_QFUNCTION_HELPER void computeFluxJacobian_NS(CeedScalar dF[3][5][5],
3a8779fbSJames Wright    const CeedScalar rho, const CeedScalar u[3], const CeedScalar E,
bb8a0c61SJames Wright    const CeedScalar gamma, const CeedScalar g[3], const CeedScalar x[3]) {
3a8779fbSJames Wright  CeedScalar u_sq = u[0]*u[0] + u[1]*u[1] + u[2]*u[2]; // Velocity square
bb8a0c61SJames Wright  CeedScalar e_potential = -(g[0]*x[0] + g[1]*x[1] + g[2]*x[2]);
3a8779fbSJames Wright  for (CeedInt i=0; i<3; i++) { // Jacobian matrices for 3 directions
3a8779fbSJames Wright    for (CeedInt j=0; j<3; j++) { // Rows of each Jacobian matrix
bb8a0c61SJames Wright      dF[i][j+1][0] = ((i==j) ? ((gamma-1.)*(u_sq/2. - e_potential)) : 0.) -
bb8a0c61SJames Wright                      u[i]*u[j];
3a8779fbSJames Wright      for (CeedInt k=0; k<3; k++) { // Columns of each Jacobian matrix
3a8779fbSJames Wright        dF[i][0][k+1]   = ((i==k) ? 1. : 0.);
3a8779fbSJames Wright        dF[i][j+1][k+1] = ((j==k) ? u[i] : 0.) +
3a8779fbSJames Wright                          ((i==k) ? u[j] : 0.) -
3a8779fbSJames Wright                          ((i==j) ? u[k] : 0.) * (gamma-1.);
3a8779fbSJames Wright        dF[i][4][k+1]   = ((i==k) ? (E*gamma/rho - (gamma-1.)*u_sq/2.) : 0.) -
3a8779fbSJames Wright                          (gamma-1.)*u[i]*u[k];
3a8779fbSJames Wright      }
3a8779fbSJames Wright      dF[i][j+1][4] = ((i==j) ? (gamma-1.) : 0.);
3a8779fbSJames Wright    }
3a8779fbSJames Wright    dF[i][4][0] = u[i] * ((gamma-1.)*u_sq - E*gamma/rho);
3a8779fbSJames Wright    dF[i][4][4] = u[i] * gamma;
3a8779fbSJames Wright  }
3a8779fbSJames Wright}
3a8779fbSJames Wright
3a8779fbSJames Wright// *****************************************************************************
bb8a0c61SJames Wright// Helper function for computing flux Jacobian of Primitive variables
bb8a0c61SJames Wright// *****************************************************************************
// Computes dF[i] = dF_i/dY, the Jacobian of the inviscid flux in direction i
// with respect to the primitive variables Y = (p, u_1, u_2, u_3, T).
// Rows are ordered (continuity, momentum_1..3, energy) and columns follow Y.
// Temperature is recovered from the inputs as T = (E/rho - |u|^2/2) / cv.
CEED_QFUNCTION_HELPER void computeFluxJacobian_NSp(CeedScalar dF[3][5][5],
    const CeedScalar rho, const CeedScalar u[3], const CeedScalar E,
    const CeedScalar Rd, const CeedScalar cv) {
  // TODO Add in gravity's contribution
  const CeedScalar vel_sq   = u[0]*u[0] + u[1]*u[1] + u[2]*u[2];
  const CeedScalar e_total  = E / rho;
  const CeedScalar T        = (e_total - vel_sq / 2.) / cv;
  const CeedScalar drho_dT  = -rho / T;
  const CeedScalar drho_dP  = 1. / (Rd * T);
  const CeedScalar dFe_dP   = drho_dP * e_total + 1.;
  const CeedScalar E_plus_P = (E + rho * Rd * T);
  const CeedScalar dFe_dT   = drho_dT * e_total + rho * cv;

  for (CeedInt dir=0; dir<3; dir++) { // One Jacobian matrix per direction
    CeedScalar (*A)[5] = dF[dir];     // A[row][col]

    // Pressure and temperature columns of the continuity and energy rows
    A[0][0] = u[dir] * drho_dP; // F^c wrt p
    A[0][4] = u[dir] * drho_dT; // F^c wrt T
    A[4][0] = u[dir] * dFe_dP;  // F^e wrt p
    A[4][4] = u[dir] * dFe_dT;  // F^e wrt T

    // Velocity columns of the continuity and energy rows
    for (CeedInt col=0; col<3; col++) {
      A[0][col+1] = ((dir==col) ? rho : 0.);      // F^c wrt u_col
      A[4][col+1] = rho * u[dir] * u[col]
                    + ((dir==col) ? E_plus_P : 0.); // F^e wrt u_col
    }

    // Momentum rows
    for (CeedInt m=0; m<3; m++) {
      A[m+1][0] = drho_dP * u[dir] * u[m] + ((dir==m) ? 1. : 0.); // F^{m} wrt p
      for (CeedInt col=0; col<3; col++) {
        A[m+1][col+1] = (((m==col)   ? u[dir] : 0.) +             // F^{m} wrt u_col
                         ((dir==col) ? u[m]   : 0.) ) * rho;
      }
      A[m+1][4] = drho_dT * u[dir] * u[m];                        // F^{m} wrt T
    }
  }
}
bb8a0c61SJames Wright
// Maps a perturbation dY = (dp, du_1, du_2, du_3, dT) of the primitive
// variables to the matching perturbation dU of the conservative variables
// (density, momentum, total energy), linearized about the state (rho, u, E).
// Temperature is recovered as T = (E/rho - |u|^2/2) / cv and the density
// perturbation uses rho = p / (Rd T).
CEED_QFUNCTION_HELPER void PrimitiveToConservative_fwd(const CeedScalar rho,
    const CeedScalar u[3], const CeedScalar E, const CeedScalar Rd,
    const CeedScalar cv, const CeedScalar dY[5], CeedScalar dU[5]) {
  const CeedScalar vel_sq  = u[0]*u[0] + u[1]*u[1] + u[2]*u[2];
  const CeedScalar T       = ( E / rho - vel_sq / 2. ) / cv;
  const CeedScalar drho_dT = -rho / T;
  const CeedScalar drho_dP = 1. / ( Rd * T);

  // Density perturbation from the pressure and temperature perturbations
  const CeedScalar d_rho = drho_dP * dY[0] + drho_dT * dY[4];
  dU[0] = d_rho;

  // Momentum perturbation, accumulating u . du along the way
  CeedScalar u_dot_du = 0;
  for (CeedInt d=0; d<3; d++) {
    dU[1+d] = d_rho * u[d] + rho * dY[1+d];
    u_dot_du += u[d] * dY[1+d];
  }

  dU[4] = rho * cv * dY[4] + d_rho * cv * T // internal energy: rho * e
          + rho * u_dot_du + .5 * d_rho * vel_sq; // kinetic energy: .5 * rho * |u|^2
}
bb8a0c61SJames Wright
bb8a0c61SJames Wright// *****************************************************************************
bb8a0c61SJames Wright// Helper function for computing Tau elements (stabilization constant)
bb8a0c61SJames Wright//   Model from:
bb8a0c61SJames Wright//     PHASTA
bb8a0c61SJames Wright//
bb8a0c61SJames Wright//   Tau_d[i] uses itau=0, which is diagonal-Shakib (still 3 values, but not spatial)
bb8a0c61SJames Wright//
bb8a0c61SJames Wright// Where: (term descriptions NOT UPDATED YET)
bb8a0c61SJames Wright// *****************************************************************************
// Fills Tau_d with three stabilization coefficients built from the metric
// g = dXdx^T dXdx, the velocity u, the density rho, the viscosity mu and the
// time step dt:
//   Tau_d[0] - scaled by Ctau_C
//   Tau_d[1] - scaled by Ctau_M
//   Tau_d[2] - scaled by Ctau_E and divided by cv
// The Ctau_* constants are read from newt_ctx.
CEED_QFUNCTION_HELPER void Tau_diagPrim(CeedScalar Tau_d[3],
                                        const CeedScalar dXdx[3][3], const CeedScalar u[3],
                                        const CeedScalar cv, const NewtonianIdealGasContext newt_ctx,
                                        const CeedScalar mu, const CeedScalar dt,
                                        const CeedScalar rho) {
  // Context
  const CeedScalar Ctau_t = newt_ctx->Ctau_t;
  const CeedScalar Ctau_v = newt_ctx->Ctau_v;
  const CeedScalar Ctau_C = newt_ctx->Ctau_C;
  const CeedScalar Ctau_M = newt_ctx->Ctau_M;
  const CeedScalar Ctau_E = newt_ctx->Ctau_E;

  // Upper triangle of the symmetric metric g_ab = sum_k dXdx[k][a] * dXdx[k][b]
  //*INDENT-OFF*
  const CeedScalar g00 = dXdx[0][0]*dXdx[0][0] + dXdx[1][0]*dXdx[1][0] + dXdx[2][0]*dXdx[2][0];
  const CeedScalar g01 = dXdx[0][0]*dXdx[0][1] + dXdx[1][0]*dXdx[1][1] + dXdx[2][0]*dXdx[2][1];
  const CeedScalar g11 = dXdx[0][1]*dXdx[0][1] + dXdx[1][1]*dXdx[1][1] + dXdx[2][1]*dXdx[2][1];
  const CeedScalar g02 = dXdx[0][0]*dXdx[0][2] + dXdx[1][0]*dXdx[1][2] + dXdx[2][0]*dXdx[2][2];
  const CeedScalar g12 = dXdx[0][1]*dXdx[0][2] + dXdx[1][1]*dXdx[1][2] + dXdx[2][1]*dXdx[2][2];
  const CeedScalar g22 = dXdx[0][2]*dXdx[0][2] + dXdx[1][2]*dXdx[1][2] + dXdx[2][2]*dXdx[2][2];
  //*INDENT-ON*

  const CeedScalar dts = Ctau_t / dt;

  // Temporal term plus u^T g u
  const CeedScalar advective = (4. * dts * dts)
                               + u[0] * ( u[0] * g00 + 2. * ( u[1] * g01 + u[2] * g02))
                               + u[1] * ( u[1] * g11 + 2. *   u[2] * g12)
                               + u[2] *   u[2] * g22;
  // g : g (sum of squares of all nine entries of the symmetric metric)
  const CeedScalar metric_sq = g00*g00 + g11*g11 + g22*g22
                               + 2. * (g01*g01 + g02*g02 + g12*g12);

  const CeedScalar tau_sq   = rho*rho*advective + Ctau_v* mu * mu * metric_sq;
  const CeedScalar tau_root = sqrt(tau_sq);

  Tau_d[0] = Ctau_C * tau_root / (rho*(g00 + g11 + g22))*0.125;
  Tau_d[1] = Ctau_M / tau_root;
  Tau_d[2] = Ctau_E / ( tau_root * cv );

  // Design note: Tau_d[2] could instead be written as Ctau_E * Tau_d[1] / cv
  // to save a division, provided the compiler recognizes cv as a constant it
  // can invert once for all elements; the energy tau would then be scaled by
  // the product Ctau_E * Ctau_M. Alternatively cv could be absorbed into
  // Ctau_E, but that puts more burden on the user to know how to change the
  // constants when the fluid or units change. The same applies to
  // Ctau_v * mu * mu IF AND ONLY IF no viscosity law mu = f(T) is added.
}
bb8a0c61SJames Wright
bb8a0c61SJames Wright// *****************************************************************************
3a8779fbSJames Wright// This QFunction sets a "still" initial condition for generic Newtonian IG problems
3a8779fbSJames Wright// *****************************************************************************
3a8779fbSJames WrightCEED_QFUNCTION(ICsNewtonianIG)(void *ctx, CeedInt Q,
3a8779fbSJames Wright                               const CeedScalar *const *in, CeedScalar *const *out) {
3a8779fbSJames Wright  // Inputs
3a8779fbSJames Wright  const CeedScalar (*X)[CEED_Q_VLA] = (const CeedScalar(*)[CEED_Q_VLA])in[0];
3a8779fbSJames Wright
3a8779fbSJames Wright  // Outputs
3a8779fbSJames Wright  CeedScalar (*q0)[CEED_Q_VLA] = (CeedScalar(*)[CEED_Q_VLA])out[0];
3a8779fbSJames Wright
bb8a0c61SJames Wright  // Context
bb8a0c61SJames Wright  const SetupContext context = (SetupContext)ctx;
bb8a0c61SJames Wright  const CeedScalar theta0    = context->theta0;
bb8a0c61SJames Wright  const CeedScalar P0        = context->P0;
bb8a0c61SJames Wright  const CeedScalar cv        = context->cv;
bb8a0c61SJames Wright  const CeedScalar cp        = context->cp;
bb8a0c61SJames Wright  const CeedScalar *g        = context->g;
bb8a0c61SJames Wright  const CeedScalar Rd        = cp - cv;
bb8a0c61SJames Wright
3a8779fbSJames Wright  // Quadrature Point Loop
3a8779fbSJames Wright  CeedPragmaSIMD
3a8779fbSJames Wright  for (CeedInt i=0; i<Q; i++) {
3a8779fbSJames Wright    CeedScalar q[5] = {0.};
3a8779fbSJames Wright
3a8779fbSJames Wright    // Setup
3a8779fbSJames Wright    // -- Coordinates
bb8a0c61SJames Wright    const CeedScalar x[3] = {X[0][i], X[1][i], X[2][i]};
bb8a0c61SJames Wright    const CeedScalar e_potential = -(g[0]*x[0] + g[1]*x[1] + g[2]*x[2]);
3a8779fbSJames Wright
3a8779fbSJames Wright    // -- Density
bb8a0c61SJames Wright    const CeedScalar rho = P0 / (Rd*theta0);
3a8779fbSJames Wright
3a8779fbSJames Wright    // Initial Conditions
3a8779fbSJames Wright    q[0] = rho;
3a8779fbSJames Wright    q[1] = 0.0;
3a8779fbSJames Wright    q[2] = 0.0;
3a8779fbSJames Wright    q[3] = 0.0;
bb8a0c61SJames Wright    q[4] = rho * (cv*theta0 + e_potential);
3a8779fbSJames Wright
3a8779fbSJames Wright    for (CeedInt j=0; j<5; j++)
3a8779fbSJames Wright      q0[j][i] = q[j];
3a8779fbSJames Wright  } // End of Quadrature Point Loop
3a8779fbSJames Wright  return 0;
3a8779fbSJames Wright}
3a8779fbSJames Wright
3a8779fbSJames Wright// *****************************************************************************
3a8779fbSJames Wright// This QFunction implements the following formulation of Navier-Stokes with
3a8779fbSJames Wright//   explicit time stepping method
3a8779fbSJames Wright//
3a8779fbSJames Wright// This is 3D compressible Navier-Stokes in conservation form with state
3a8779fbSJames Wright//   variables of density, momentum density, and total energy density.
3a8779fbSJames Wright//
3a8779fbSJames Wright// State Variables: q = ( rho, U1, U2, U3, E )
3a8779fbSJames Wright//   rho - Mass Density
3a8779fbSJames Wright//   Ui  - Momentum Density,      Ui = rho ui
3a8779fbSJames Wright//   E   - Total Energy Density,  E  = rho (cv T + (u u)/2 + g z)
3a8779fbSJames Wright//
3a8779fbSJames Wright// Navier-Stokes Equations:
3a8779fbSJames Wright//   drho/dt + div( U )                               = 0
3a8779fbSJames Wright//   dU/dt   + div( rho (u x u) + P I3 ) + rho g khat = div( Fu )
3a8779fbSJames Wright//   dE/dt   + div( (E + P) u )                       = div( Fe )
3a8779fbSJames Wright//
3a8779fbSJames Wright// Viscous Stress:
3a8779fbSJames Wright//   Fu = mu (grad( u ) + grad( u )^T + lambda div ( u ) I3)
3a8779fbSJames Wright//
3a8779fbSJames Wright// Thermal Stress:
3a8779fbSJames Wright//   Fe = u Fu + k grad( T )
bb8a0c61SJames Wright// Equation of State
3a8779fbSJames Wright//   P = (gamma - 1) (E - rho (u u) / 2 - rho g z)
3a8779fbSJames Wright//
3a8779fbSJames Wright// Stabilization:
3a8779fbSJames Wright//   Tau = diag(TauC, TauM, TauM, TauM, TauE)
3a8779fbSJames Wright//     f1 = rho  sqrt(ui uj gij)
3a8779fbSJames Wright//     gij = dXi/dX * dXi/dX
3a8779fbSJames Wright//     TauC = Cc f1 / (8 gii)
3a8779fbSJames Wright//     TauM = min( 1 , 1 / f1 )
3a8779fbSJames Wright//     TauE = TauM / (Ce cv)
3a8779fbSJames Wright//
3a8779fbSJames Wright//  SU   = Galerkin + grad(v) . ( Ai^T * Tau * (Aj q,j) )
3a8779fbSJames Wright//
3a8779fbSJames Wright// Constants:
3a8779fbSJames Wright//   lambda = - 2 / 3,  From Stokes hypothesis
3a8779fbSJames Wright//   mu              ,  Dynamic viscosity
3a8779fbSJames Wright//   k               ,  Thermal conductivity
3a8779fbSJames Wright//   cv              ,  Specific heat, constant volume
3a8779fbSJames Wright//   cp              ,  Specific heat, constant pressure
3a8779fbSJames Wright//   g               ,  Gravity
3a8779fbSJames Wright//   gamma  = cp / cv,  Specific heat ratio
3a8779fbSJames Wright//
3a8779fbSJames Wright// We require the product of the inverse of the Jacobian (dXdx_j,k) and
3a8779fbSJames Wright// its transpose (dXdx_k,j) to properly compute integrals of the form:
3a8779fbSJames Wright// int( gradv gradu )
3a8779fbSJames Wright//
3a8779fbSJames Wright// *****************************************************************************
// Explicit right-hand side at each quadrature point.
//   in[0]  - state q (5 components)
//   in[1]  - reference-space gradient of q
//   in[2]  - q_data: wdetJ followed by the 9 entries of dXdx
//   in[3]  - coordinates x
//   out[0] - v:      wdetJ * body force
//   out[1] - Grad_v: wdetJ * dXdx * (inviscid + viscous flux), minus the SU
//            stabilization term when context->stabilization == STAB_SU
CEED_QFUNCTION(RHSFunction_Newtonian)(void *ctx, CeedInt Q,
                                      const CeedScalar *const *in, CeedScalar *const *out) {
  // *INDENT-OFF*
  // Inputs
  const CeedScalar (*q)[CEED_Q_VLA]         = (const CeedScalar(*)[CEED_Q_VLA])in[0],
                   (*Grad_q)[5][CEED_Q_VLA] = (const CeedScalar(*)[5][CEED_Q_VLA])in[1],
                   (*q_data)[CEED_Q_VLA]    = (const CeedScalar(*)[CEED_Q_VLA])in[2],
                   (*x)[CEED_Q_VLA]         = (const CeedScalar(*)[CEED_Q_VLA])in[3];
  // Outputs
  CeedScalar (*v)[CEED_Q_VLA]         = (CeedScalar(*)[CEED_Q_VLA])out[0],
             (*Grad_v)[5][CEED_Q_VLA] = (CeedScalar(*)[5][CEED_Q_VLA])out[1];
  // *INDENT-ON*

  // Context
  NewtonianIdealGasContext context = (NewtonianIdealGasContext)ctx;
  const CeedScalar mu     = context->mu;
  const CeedScalar cv     = context->cv;
  const CeedScalar cp     = context->cp;
  const CeedScalar *g     = context->g;
  const CeedScalar dt     = context->dt;
  const CeedScalar gamma  = cp / cv;
  const CeedScalar Rd     = cp - cv;

  // Quadrature Point Loop
  CeedPragmaSIMD
  for (CeedInt i=0; i<Q; i++) {
    // -- State at this point
    const CeedScalar x_i[3] = {x[0][i], x[1][i], x[2][i]};
    CeedScalar U[5];
    for (CeedInt n=0; n<5; n++) U[n] = q[n][i];
    State s = StateFromU(context, U, x_i);

    // -- Interp-to-Interp q_data
    const CeedScalar wdetJ = q_data[0][i];
    // -- Interp-to-Grad q_data
    // ---- Inverse of change of coordinate matrix: X_i,j
    // *INDENT-OFF*
    const CeedScalar dXdx[3][3] = {
      {q_data[1][i], q_data[2][i], q_data[3][i]},
      {q_data[4][i], q_data[5][i], q_data[6][i]},
      {q_data[7][i], q_data[8][i], q_data[9][i]}
    };
    // *INDENT-ON*

    // -- Physical-space derivative of the state in each direction
    State grad_s[3];
    for (CeedInt d=0; d<3; d++) {
      CeedScalar dU[5], dx_i[3] = {0};
      dx_i[d] = 1.;
      for (CeedInt n=0; n<5; n++) {
        dU[n] = Grad_q[0][n][i] * dXdx[0][d] +
                Grad_q[1][n][i] * dXdx[1][d] +
                Grad_q[2][n][i] * dXdx[2][d];
      }
      grad_s[d] = StateFromU_fwd(context, s, dU, x_i, dx_i);
    }

    // -- Viscous stress and viscous energy flux
    CeedScalar strain_rate[6], kmstress[6], stress[3][3], Fe[3];
    KMStrainRate(grad_s, strain_rate);
    NewtonianStress(context, strain_rate, kmstress);
    KMUnpack(kmstress, stress);
    ViscousEnergyFlux(context, s.Y, grad_s, stress, Fe);

    // -- Inviscid flux
    StateConservative F_inviscid[3];
    FluxInviscid(context, s, F_inviscid);

    // -- Total flux, Flux[component][direction]
    CeedScalar Flux[5][3];
    for (CeedInt d=0; d<3; d++) {
      Flux[0][d] = F_inviscid[d].density;
      for (CeedInt m=0; m<3; m++) {
        Flux[m+1][d] = F_inviscid[d].momentum[m] - stress[m][d];
      }
      Flux[4][d] = F_inviscid[d].E_total + Fe[d];
    }

    // -- Weak-form flux term
    for (CeedInt n=0; n<5; n++) {
      for (CeedInt d=0; d<3; d++) {
        Grad_v[d][n][i] = wdetJ * (dXdx[d][0] * Flux[n][0] +
                                   dXdx[d][1] * Flux[n][1] +
                                   dXdx[d][2] * Flux[n][2]);
      }
    }

    // -- Body force (gravity acts on the momentum components only)
    const CeedScalar body_force[5] = {0, s.U.density *g[0], s.U.density *g[1], s.U.density *g[2], 0};
    for (CeedInt n=0; n<5; n++) {
      v[n][i] = wdetJ * body_force[n];
    }

    // -- jacob_F_conv[3][5][5] = dF(convective)/dq at each direction
    CeedScalar jacob_F_conv[3][5][5] = {0};
    computeFluxJacobian_NS(jacob_F_conv, s.U.density, s.Y.velocity, s.U.E_total,
                           gamma, g, x_i);

    // -- Gradient of the conservative variables, grad_U[component][direction]
    CeedScalar grad_U[5][3];
    for (CeedInt d=0; d<3; d++) {
      grad_U[0][d] = grad_s[d].U.density;
      for (CeedInt m=0; m<3; m++) {
        grad_U[m+1][d] = grad_s[d].U.momentum[m];
      }
      grad_U[4][d] = grad_s[d].U.E_total;
    }

    // -- strong_conv = dF/dq * dq/dx    (Strong convection)
    CeedScalar strong_conv[5] = {0};
    for (CeedInt n=0; n<5; n++) {
      for (CeedInt d=0; d<3; d++) {
        for (CeedInt l=0; l<5; l++) {
          strong_conv[n] += jacob_F_conv[d][n][l] * grad_U[l][d];
        }
      }
    }

    // -- Stabilization method: none, SU, or SUPG
    switch (context->stabilization) {
    case STAB_NONE:        // Galerkin
      break;
    case STAB_SU: {        // SU
      CeedScalar Tau_d[3] = {0.};
      Tau_diagPrim(Tau_d, dXdx, s.Y.velocity, cv, context, mu, dt, s.U.density);

      // Tau_d[0] scales the first component, Tau_d[1] the three momentum
      // components, and Tau_d[2] the last component
      const CeedScalar tau_strong_conv[5] = {
        Tau_d[0] * strong_conv[0],
        Tau_d[1] * strong_conv[1],
        Tau_d[1] * strong_conv[2],
        Tau_d[1] * strong_conv[3],
        Tau_d[2] * strong_conv[4]
      };
      CeedScalar tau_strong_conv_conservative[5] = {0};
      PrimitiveToConservative_fwd(s.U.density, s.Y.velocity, s.U.E_total, Rd, cv,
                                  tau_strong_conv,
                                  tau_strong_conv_conservative);

      CeedScalar stab[5][3] = {{0.}};
      for (CeedInt n=0; n<5; n++) {
        for (CeedInt d=0; d<3; d++) {
          for (CeedInt l=0; l<5; l++) {
            stab[n][d] += jacob_F_conv[d][n][l] * tau_strong_conv_conservative[l];
          }
        }
      }

      for (CeedInt n=0; n<5; n++) {
        for (CeedInt d=0; d<3; d++) {
          Grad_v[d][n][i] -= wdetJ*(stab[n][0] * dXdx[d][0] +
                                    stab[n][1] * dXdx[d][1] +
                                    stab[n][2] * dXdx[d][2]);
        }
      }
      break;
    }
    case STAB_SUPG:        // SUPG is not implemented for explicit scheme
      break;
    }

  } // End Quadrature Point Loop

  // Return
  return 0;
}
3a8779fbSJames Wright
3a8779fbSJames Wright// *****************************************************************************
3a8779fbSJames Wright// This QFunction implements the Navier-Stokes equations (mentioned above) with
3a8779fbSJames Wright//   implicit time stepping method
3a8779fbSJames Wright//
3a8779fbSJames Wright//  SU   = Galerkin + grad(v) . ( Ai^T * Tau * (Aj q,j) )
3a8779fbSJames Wright//  SUPG = Galerkin + grad(v) . ( Ai^T * Tau * (q_dot + Aj q,j - body force) )
3a8779fbSJames Wright//                                       (diffusive terms will be added later)
3a8779fbSJames Wright//
3a8779fbSJames Wright// *****************************************************************************
3a8779fbSJames WrightCEED_QFUNCTION(IFunction_Newtonian)(void *ctx, CeedInt Q,
3a8779fbSJames Wright                                    const CeedScalar *const *in,
3a8779fbSJames Wright                                    CeedScalar *const *out) {
3a8779fbSJames Wright  // *INDENT-OFF*
3a8779fbSJames Wright  // Inputs
3a8779fbSJames Wright  const CeedScalar (*q)[CEED_Q_VLA] = (const CeedScalar(*)[CEED_Q_VLA])in[0],
752f40e3SJed Brown                   (*Grad_q)[5][CEED_Q_VLA] = (const CeedScalar(*)[5][CEED_Q_VLA])in[1],
3a8779fbSJames Wright                   (*q_dot)[CEED_Q_VLA] = (const CeedScalar(*)[CEED_Q_VLA])in[2],
3a8779fbSJames Wright                   (*q_data)[CEED_Q_VLA] = (const CeedScalar(*)[CEED_Q_VLA])in[3],
3a8779fbSJames Wright                   (*x)[CEED_Q_VLA] = (const CeedScalar(*)[CEED_Q_VLA])in[4];
3a8779fbSJames Wright  // Outputs
3a8779fbSJames Wright  CeedScalar (*v)[CEED_Q_VLA] = (CeedScalar(*)[CEED_Q_VLA])out[0],
752f40e3SJed Brown             (*Grad_v)[5][CEED_Q_VLA] = (CeedScalar(*)[5][CEED_Q_VLA])out[1],
752f40e3SJed Brown             (*jac_data)[CEED_Q_VLA] = (CeedScalar(*)[CEED_Q_VLA])out[2];
3a8779fbSJames Wright  // *INDENT-ON*
3a8779fbSJames Wright  // Context
3a8779fbSJames Wright  NewtonianIdealGasContext context = (NewtonianIdealGasContext)ctx;
3a8779fbSJames Wright  const CeedScalar mu     = context->mu;
3a8779fbSJames Wright  const CeedScalar cv     = context->cv;
3a8779fbSJames Wright  const CeedScalar cp     = context->cp;
bb8a0c61SJames Wright  const CeedScalar *g     = context->g;
bb8a0c61SJames Wright  const CeedScalar dt     = context->dt;
3a8779fbSJames Wright  const CeedScalar gamma  = cp / cv;
bb8a0c61SJames Wright  const CeedScalar Rd     = cp-cv;
3a8779fbSJames Wright
3a8779fbSJames Wright  CeedPragmaSIMD
3a8779fbSJames Wright  // Quadrature Point Loop
3a8779fbSJames Wright  for (CeedInt i=0; i<Q; i++) {
c1a52365SJed Brown    CeedScalar U[5];
eef2387dSJed Brown    for (CeedInt j=0; j<5; j++) U[j] = q[j][i];
c1a52365SJed Brown    const CeedScalar x_i[3] = {x[0][i], x[1][i], x[2][i]};
c1a52365SJed Brown    State s = StateFromU(context, U, x_i);
c1a52365SJed Brown
3a8779fbSJames Wright    // -- Interp-to-Interp q_data
3a8779fbSJames Wright    const CeedScalar wdetJ      =   q_data[0][i];
3a8779fbSJames Wright    // -- Interp-to-Grad q_data
3a8779fbSJames Wright    // ---- Inverse of change of coordinate matrix: X_i,j
3a8779fbSJames Wright    // *INDENT-OFF*
3a8779fbSJames Wright    const CeedScalar dXdx[3][3] = {{q_data[1][i],
3a8779fbSJames Wright                                    q_data[2][i],
3a8779fbSJames Wright                                    q_data[3][i]},
3a8779fbSJames Wright                                   {q_data[4][i],
3a8779fbSJames Wright                                    q_data[5][i],
3a8779fbSJames Wright                                    q_data[6][i]},
3a8779fbSJames Wright                                   {q_data[7][i],
3a8779fbSJames Wright                                    q_data[8][i],
3a8779fbSJames Wright                                    q_data[9][i]}
3a8779fbSJames Wright                                  };
3a8779fbSJames Wright    // *INDENT-ON*
c1a52365SJed Brown    State grad_s[3];
493642f1SJames Wright    for (CeedInt j=0; j<3; j++) {
2f7ce6c1SJed Brown      CeedScalar dx_i[3] = {0}, dU[5];
2556a851SJed Brown      for (CeedInt k=0; k<5; k++)
2556a851SJed Brown        dU[k] = Grad_q[0][k][i] * dXdx[0][j] +
2556a851SJed Brown                Grad_q[1][k][i] * dXdx[1][j] +
2556a851SJed Brown                Grad_q[2][k][i] * dXdx[2][j];
c1a52365SJed Brown      dx_i[j] = 1.;
2f7ce6c1SJed Brown      grad_s[j] = StateFromU_fwd(context, s, dU, x_i, dx_i);
3a8779fbSJames Wright    }
c1a52365SJed Brown
c1a52365SJed Brown    CeedScalar strain_rate[6], kmstress[6], stress[3][3], Fe[3];
c1a52365SJed Brown    KMStrainRate(grad_s, strain_rate);
c1a52365SJed Brown    NewtonianStress(context, strain_rate, kmstress);
c1a52365SJed Brown    KMUnpack(kmstress, stress);
c1a52365SJed Brown    ViscousEnergyFlux(context, s.Y, grad_s, stress, Fe);
c1a52365SJed Brown
c1a52365SJed Brown    StateConservative F_inviscid[3];
c1a52365SJed Brown    FluxInviscid(context, s, F_inviscid);
c1a52365SJed Brown
c1a52365SJed Brown
c1a52365SJed Brown    // Total flux
c1a52365SJed Brown    CeedScalar Flux[5][3];
eef2387dSJed Brown    for (CeedInt j=0; j<3; j++) {
c1a52365SJed Brown      Flux[0][j] = F_inviscid[j].density;
493642f1SJames Wright      for (CeedInt k=0; k<3; k++)
c1a52365SJed Brown        Flux[k+1][j] = F_inviscid[j].momentum[k] - stress[k][j];
c1a52365SJed Brown      Flux[4][j] = F_inviscid[j].E_total + Fe[j];
c1a52365SJed Brown    }
c1a52365SJed Brown
eef2387dSJed Brown    for (CeedInt j=0; j<3; j++) {
eef2387dSJed Brown      for (CeedInt k=0; k<5; k++) {
752f40e3SJed Brown        Grad_v[j][k][i] = -wdetJ * (dXdx[j][0] * Flux[k][0] +
c1a52365SJed Brown                                    dXdx[j][1] * Flux[k][1] +
c1a52365SJed Brown                                    dXdx[j][2] * Flux[k][2]);
c1a52365SJed Brown      }
c1a52365SJed Brown    }
c1a52365SJed Brown
c1a52365SJed Brown    const CeedScalar body_force[5] = {0, s.U.density *g[0], s.U.density *g[1], s.U.density *g[2], 0};
eef2387dSJed Brown    for (CeedInt j=0; j<5; j++)
c1a52365SJed Brown      v[j][i] = wdetJ * (q_dot[j][i] - body_force[j]);
3a8779fbSJames Wright
3a8779fbSJames Wright    // jacob_F_conv[3][5][5] = dF(convective)/dq at each direction
c1a52365SJed Brown    CeedScalar jacob_F_conv[3][5][5] = {0};
c1a52365SJed Brown    computeFluxJacobian_NS(jacob_F_conv, s.U.density, s.Y.velocity, s.U.E_total,
c1a52365SJed Brown                           gamma, g, x_i);
c1a52365SJed Brown    CeedScalar grad_U[5][3];
493642f1SJames Wright    for (CeedInt j=0; j<3; j++) {
c1a52365SJed Brown      grad_U[0][j] = grad_s[j].U.density;
eef2387dSJed Brown      for (CeedInt k=0; k<3; k++) grad_U[k+1][j] = grad_s[j].U.momentum[k];
c1a52365SJed Brown      grad_U[4][j] = grad_s[j].U.E_total;
3a8779fbSJames Wright    }
c1a52365SJed Brown
3a8779fbSJames Wright    // strong_conv = dF/dq * dq/dx    (Strong convection)
3a8779fbSJames Wright    CeedScalar strong_conv[5] = {0};
493642f1SJames Wright    for (CeedInt j=0; j<3; j++)
493642f1SJames Wright      for (CeedInt k=0; k<5; k++)
493642f1SJames Wright        for (CeedInt l=0; l<5; l++)
c1a52365SJed Brown          strong_conv[k] += jacob_F_conv[j][k][l] * grad_U[l][j];
3a8779fbSJames Wright
3a8779fbSJames Wright    // Strong residual
3a8779fbSJames Wright    CeedScalar strong_res[5];
493642f1SJames Wright    for (CeedInt j=0; j<5; j++)
3a8779fbSJames Wright      strong_res[j] = q_dot[j][i] + strong_conv[j] - body_force[j];
3a8779fbSJames Wright
3a8779fbSJames Wright    // -- Stabilization method: none, SU, or SUPG
bb8a0c61SJames Wright    CeedScalar stab[5][3] = {{0.}};
bb8a0c61SJames Wright    CeedScalar tau_strong_res[5] = {0.}, tau_strong_res_conservative[5] = {0};
bb8a0c61SJames Wright    CeedScalar tau_strong_conv[5] = {0.}, tau_strong_conv_conservative[5] = {0};
bb8a0c61SJames Wright    CeedScalar Tau_d[3] = {0.};
3a8779fbSJames Wright    switch (context->stabilization) {
3a8779fbSJames Wright    case STAB_NONE:        // Galerkin
3a8779fbSJames Wright      break;
3a8779fbSJames Wright    case STAB_SU:        // SU
c1a52365SJed Brown      Tau_diagPrim(Tau_d, dXdx, s.Y.velocity, cv, context, mu, dt, s.U.density);
bb8a0c61SJames Wright      tau_strong_conv[0] = Tau_d[0] * strong_conv[0];
bb8a0c61SJames Wright      tau_strong_conv[1] = Tau_d[1] * strong_conv[1];
bb8a0c61SJames Wright      tau_strong_conv[2] = Tau_d[1] * strong_conv[2];
bb8a0c61SJames Wright      tau_strong_conv[3] = Tau_d[1] * strong_conv[3];
bb8a0c61SJames Wright      tau_strong_conv[4] = Tau_d[2] * strong_conv[4];
c1a52365SJed Brown      PrimitiveToConservative_fwd(s.U.density, s.Y.velocity, s.U.E_total, Rd, cv,
c1a52365SJed Brown                                  tau_strong_conv, tau_strong_conv_conservative);
493642f1SJames Wright      for (CeedInt j=0; j<3; j++)
493642f1SJames Wright        for (CeedInt k=0; k<5; k++)
493642f1SJames Wright          for (CeedInt l=0; l<5; l++)
bb8a0c61SJames Wright            stab[k][j] += jacob_F_conv[j][k][l] * tau_strong_conv_conservative[l];
3a8779fbSJames Wright
493642f1SJames Wright      for (CeedInt j=0; j<5; j++)
493642f1SJames Wright        for (CeedInt k=0; k<3; k++)
752f40e3SJed Brown          Grad_v[k][j][i] += wdetJ*(stab[j][0] * dXdx[k][0] +
3a8779fbSJames Wright                                    stab[j][1] * dXdx[k][1] +
3a8779fbSJames Wright                                    stab[j][2] * dXdx[k][2]);
eef2387dSJed Brown
3a8779fbSJames Wright      break;
3a8779fbSJames Wright    case STAB_SUPG:        // SUPG
c1a52365SJed Brown      Tau_diagPrim(Tau_d, dXdx, s.Y.velocity, cv, context, mu, dt, s.U.density);
bb8a0c61SJames Wright      tau_strong_res[0] = Tau_d[0] * strong_res[0];
bb8a0c61SJames Wright      tau_strong_res[1] = Tau_d[1] * strong_res[1];
bb8a0c61SJames Wright      tau_strong_res[2] = Tau_d[1] * strong_res[2];
bb8a0c61SJames Wright      tau_strong_res[3] = Tau_d[1] * strong_res[3];
bb8a0c61SJames Wright      tau_strong_res[4] = Tau_d[2] * strong_res[4];
bb8a0c61SJames Wright// Alternate route (useful later with primitive variable code)
bb8a0c61SJames Wright// this function was verified against PHASTA for as IC that was as close as possible
bb8a0c61SJames Wright//    computeFluxJacobian_NSp(jacob_F_conv_p, rho, u, E, Rd, cv);
bb8a0c61SJames Wright// it has also been verified to compute a correct through the following
bb8a0c61SJames Wright//   stab[k][j] += jacob_F_conv_p[j][k][l] * tau_strong_res[l] // flux Jacobian wrt primitive
bb8a0c61SJames Wright// applied in the triple loop below
bb8a0c61SJames Wright//  However, it is more flops than using the existing Jacobian wrt q after q_{,Y} viz
c1a52365SJed Brown      PrimitiveToConservative_fwd(s.U.density, s.Y.velocity, s.U.E_total, Rd, cv,
c1a52365SJed Brown                                  tau_strong_res, tau_strong_res_conservative);
493642f1SJames Wright      for (CeedInt j=0; j<3; j++)
493642f1SJames Wright        for (CeedInt k=0; k<5; k++)
493642f1SJames Wright          for (CeedInt l=0; l<5; l++)
bb8a0c61SJames Wright            stab[k][j] += jacob_F_conv[j][k][l] * tau_strong_res_conservative[l];
3a8779fbSJames Wright
493642f1SJames Wright      for (CeedInt j=0; j<5; j++)
493642f1SJames Wright        for (CeedInt k=0; k<3; k++)
752f40e3SJed Brown          Grad_v[k][j][i] += wdetJ*(stab[j][0] * dXdx[k][0] +
3a8779fbSJames Wright                                    stab[j][1] * dXdx[k][1] +
3a8779fbSJames Wright                                    stab[j][2] * dXdx[k][2]);
3a8779fbSJames Wright      break;
3a8779fbSJames Wright    }
eef2387dSJed Brown    for (CeedInt j=0; j<5; j++) jac_data[j][i] = U[j];
eef2387dSJed Brown    for (CeedInt j=0; j<6; j++) jac_data[5+j][i] = kmstress[j];
eef2387dSJed Brown    for (CeedInt j=0; j<3; j++) jac_data[5+6+j][i] = Tau_d[j];
3a8779fbSJames Wright
3a8779fbSJames Wright  } // End Quadrature Point Loop
3a8779fbSJames Wright
3a8779fbSJames Wright  // Return
3a8779fbSJames Wright  return 0;
3a8779fbSJames Wright}
f0b65372SJed Brown
f0b65372SJed BrownCEED_QFUNCTION(IJacobian_Newtonian)(void *ctx, CeedInt Q,
f0b65372SJed Brown                                    const CeedScalar *const *in,
f0b65372SJed Brown                                    CeedScalar *const *out) {
f0b65372SJed Brown  // *INDENT-OFF*
f0b65372SJed Brown  // Inputs
f0b65372SJed Brown  const CeedScalar (*dq)[CEED_Q_VLA] = (const CeedScalar(*)[CEED_Q_VLA])in[0],
f0b65372SJed Brown                   (*Grad_dq)[5][CEED_Q_VLA] = (const CeedScalar(*)[5][CEED_Q_VLA])in[1],
f0b65372SJed Brown                   (*q_data)[CEED_Q_VLA] = (const CeedScalar(*)[CEED_Q_VLA])in[2],
f0b65372SJed Brown                   (*x)[CEED_Q_VLA] = (const CeedScalar(*)[CEED_Q_VLA])in[3],
f0b65372SJed Brown                   (*jac_data)[CEED_Q_VLA] = (const CeedScalar(*)[CEED_Q_VLA])in[4];
f0b65372SJed Brown  // Outputs
f0b65372SJed Brown  CeedScalar (*v)[CEED_Q_VLA] = (CeedScalar(*)[CEED_Q_VLA])out[0],
f0b65372SJed Brown             (*Grad_v)[5][CEED_Q_VLA] = (CeedScalar(*)[5][CEED_Q_VLA])out[1];
f0b65372SJed Brown  // *INDENT-ON*
f0b65372SJed Brown  // Context
f0b65372SJed Brown  NewtonianIdealGasContext context = (NewtonianIdealGasContext)ctx;
f0b65372SJed Brown  const CeedScalar *g = context->g;
f0b65372SJed Brown  const CeedScalar cp = context->cp;
f0b65372SJed Brown  const CeedScalar cv = context->cv;
f0b65372SJed Brown  const CeedScalar Rd = cp - cv;
f0b65372SJed Brown  const CeedScalar gamma = cp / cv;
f0b65372SJed Brown
f0b65372SJed Brown  CeedPragmaSIMD
f0b65372SJed Brown  // Quadrature Point Loop
f0b65372SJed Brown  for (CeedInt i=0; i<Q; i++) {
f0b65372SJed Brown    // -- Interp-to-Interp q_data
f0b65372SJed Brown    const CeedScalar wdetJ      =   q_data[0][i];
f0b65372SJed Brown    // -- Interp-to-Grad q_data
f0b65372SJed Brown    // ---- Inverse of change of coordinate matrix: X_i,j
f0b65372SJed Brown    // *INDENT-OFF*
f0b65372SJed Brown    const CeedScalar dXdx[3][3] = {{q_data[1][i],
f0b65372SJed Brown                                    q_data[2][i],
f0b65372SJed Brown                                    q_data[3][i]},
f0b65372SJed Brown                                   {q_data[4][i],
f0b65372SJed Brown                                    q_data[5][i],
f0b65372SJed Brown                                    q_data[6][i]},
f0b65372SJed Brown                                   {q_data[7][i],
f0b65372SJed Brown                                    q_data[8][i],
f0b65372SJed Brown                                    q_data[9][i]}
f0b65372SJed Brown                                  };
f0b65372SJed Brown    // *INDENT-ON*
f0b65372SJed Brown
f0b65372SJed Brown    CeedScalar U[5], kmstress[6], Tau_d[3] __attribute((unused));
f0b65372SJed Brown    for (int j=0; j<5; j++) U[j] = jac_data[j][i];
f0b65372SJed Brown    for (int j=0; j<6; j++) kmstress[j] = jac_data[5+j][i];
f0b65372SJed Brown    for (int j=0; j<3; j++) Tau_d[j] = jac_data[5+6+j][i];
f0b65372SJed Brown    const CeedScalar x_i[3] = {x[0][i], x[1][i], x[2][i]};
f0b65372SJed Brown    State s = StateFromU(context, U, x_i);
f0b65372SJed Brown
f0b65372SJed Brown    CeedScalar dU[5], dx0[3] = {0};
f0b65372SJed Brown    for (int j=0; j<5; j++) dU[j] = dq[j][i];
f0b65372SJed Brown    State ds = StateFromU_fwd(context, s, dU, x_i, dx0);
f0b65372SJed Brown
f0b65372SJed Brown    State grad_ds[3];
f0b65372SJed Brown    for (int j=0; j<3; j++) {
f0b65372SJed Brown      CeedScalar dUj[5];
f0b65372SJed Brown      for (int k=0; k<5; k++) dUj[k] = Grad_dq[0][k][i] * dXdx[0][j]
f0b65372SJed Brown                                         + Grad_dq[1][k][i] * dXdx[1][j]
f0b65372SJed Brown                                         + Grad_dq[2][k][i] * dXdx[2][j];
f0b65372SJed Brown      grad_ds[j] = StateFromU_fwd(context, s, dUj, x_i, dx0);
f0b65372SJed Brown    }
f0b65372SJed Brown
f0b65372SJed Brown    CeedScalar dstrain_rate[6], dkmstress[6], stress[3][3], dstress[3][3], dFe[3];
f0b65372SJed Brown    KMStrainRate(grad_ds, dstrain_rate);
f0b65372SJed Brown    NewtonianStress(context, dstrain_rate, dkmstress);
f0b65372SJed Brown    KMUnpack(dkmstress, dstress);
f0b65372SJed Brown    KMUnpack(kmstress, stress);
f0b65372SJed Brown    ViscousEnergyFlux_fwd(context, s.Y, ds.Y, grad_ds, stress, dstress, dFe);
f0b65372SJed Brown
f0b65372SJed Brown    StateConservative dF_inviscid[3];
f0b65372SJed Brown    FluxInviscid_fwd(context, s, ds, dF_inviscid);
f0b65372SJed Brown
f0b65372SJed Brown    // Total flux
f0b65372SJed Brown    CeedScalar dFlux[5][3];
f0b65372SJed Brown    for (int j=0; j<3; j++) {
f0b65372SJed Brown      dFlux[0][j] = dF_inviscid[j].density;
f0b65372SJed Brown      for (int k=0; k<3; k++)
f0b65372SJed Brown        dFlux[k+1][j] = dF_inviscid[j].momentum[k] - dstress[k][j];
f0b65372SJed Brown      dFlux[4][j] = dF_inviscid[j].E_total + dFe[j];
f0b65372SJed Brown    }
f0b65372SJed Brown
f0b65372SJed Brown    for (int j=0; j<3; j++) {
f0b65372SJed Brown      for (int k=0; k<5; k++) {
f0b65372SJed Brown        Grad_v[j][k][i] = -wdetJ * (dXdx[j][0] * dFlux[k][0] +
f0b65372SJed Brown                                    dXdx[j][1] * dFlux[k][1] +
f0b65372SJed Brown                                    dXdx[j][2] * dFlux[k][2]);
f0b65372SJed Brown      }
f0b65372SJed Brown    }
f0b65372SJed Brown
f0b65372SJed Brown    const CeedScalar dbody_force[5] = {0, ds.U.density *g[0], ds.U.density *g[1], ds.U.density *g[2], 0};
f0b65372SJed Brown    for (int j=0; j<5; j++)
f0b65372SJed Brown      v[j][i] = wdetJ * (context->ijacobian_time_shift * dU[j] - dbody_force[j]);
f0b65372SJed Brown
f0b65372SJed Brown    if (1) {
f0b65372SJed Brown      CeedScalar jacob_F_conv[3][5][5] = {0};
f0b65372SJed Brown      computeFluxJacobian_NS(jacob_F_conv, s.U.density, s.Y.velocity, s.U.E_total,
f0b65372SJed Brown                             gamma, g, x_i);
f0b65372SJed Brown      CeedScalar grad_dU[5][3];
f0b65372SJed Brown      for (int j=0; j<3; j++) {
f0b65372SJed Brown        grad_dU[0][j] = grad_ds[j].U.density;
f0b65372SJed Brown        for (int k=0; k<3; k++) grad_dU[k+1][j] = grad_ds[j].U.momentum[k];
f0b65372SJed Brown        grad_dU[4][j] = grad_ds[j].U.E_total;
f0b65372SJed Brown      }
f0b65372SJed Brown      CeedScalar dstrong_conv[5] = {0};
f0b65372SJed Brown      for (int j=0; j<3; j++)
f0b65372SJed Brown        for (int k=0; k<5; k++)
f0b65372SJed Brown          for (int l=0; l<5; l++)
f0b65372SJed Brown            dstrong_conv[k] += jacob_F_conv[j][k][l] * grad_dU[l][j];
f0b65372SJed Brown      CeedScalar dstrong_res[5];
f0b65372SJed Brown      for (int j=0; j<5; j++)
f0b65372SJed Brown        dstrong_res[j] = context->ijacobian_time_shift * dU[j] + dstrong_conv[j] -
f0b65372SJed Brown                         dbody_force[j];
f0b65372SJed Brown      CeedScalar dtau_strong_res[5] = {0.}, dtau_strong_res_conservative[5] = {0};
f0b65372SJed Brown      dtau_strong_res[0] = Tau_d[0] * dstrong_res[0];
f0b65372SJed Brown      dtau_strong_res[1] = Tau_d[1] * dstrong_res[1];
f0b65372SJed Brown      dtau_strong_res[2] = Tau_d[1] * dstrong_res[2];
f0b65372SJed Brown      dtau_strong_res[3] = Tau_d[1] * dstrong_res[3];
f0b65372SJed Brown      dtau_strong_res[4] = Tau_d[2] * dstrong_res[4];
f0b65372SJed Brown      PrimitiveToConservative_fwd(s.U.density, s.Y.velocity, s.U.E_total, Rd, cv,
f0b65372SJed Brown                                  dtau_strong_res, dtau_strong_res_conservative);
f0b65372SJed Brown      CeedScalar dstab[5][3] = {0};
f0b65372SJed Brown      for (int j=0; j<3; j++)
f0b65372SJed Brown        for (int k=0; k<5; k++)
f0b65372SJed Brown          for (int l=0; l<5; l++)
f0b65372SJed Brown            dstab[k][j] += jacob_F_conv[j][k][l] * dtau_strong_res_conservative[l];
f0b65372SJed Brown      for (int j=0; j<5; j++)
f0b65372SJed Brown        for (int k=0; k<3; k++)
f0b65372SJed Brown          Grad_v[k][j][i] += wdetJ*(dstab[j][0] * dXdx[k][0] +
f0b65372SJed Brown                                    dstab[j][1] * dXdx[k][1] +
f0b65372SJed Brown                                    dstab[j][2] * dXdx[k][2]);
f0b65372SJed Brown
f0b65372SJed Brown    }
f0b65372SJed Brown  } // End Quadrature Point Loop
f0b65372SJed Brown  return 0;
f0b65372SJed Brown}
*8085925cSJames Wright
*8085925cSJames Wright// Compute boundary integral (ie. for strongly set inflows)
*8085925cSJames WrightCEED_QFUNCTION(BoundaryIntegral)(void *ctx, CeedInt Q,
*8085925cSJames Wright                                 const CeedScalar *const *in,
*8085925cSJames Wright                                 CeedScalar *const *out) {
*8085925cSJames Wright
*8085925cSJames Wright  //*INDENT-OFF*
*8085925cSJames Wright  const CeedScalar (*q)[CEED_Q_VLA]          = (const CeedScalar(*)[CEED_Q_VLA]) in[0],
*8085925cSJames Wright                   (*q_data_sur)[CEED_Q_VLA] = (const CeedScalar(*)[CEED_Q_VLA]) in[2];
*8085925cSJames Wright
*8085925cSJames Wright  CeedScalar (*v)[CEED_Q_VLA] = (CeedScalar(*)[CEED_Q_VLA]) out[0];
*8085925cSJames Wright
*8085925cSJames Wright  //*INDENT-ON*
*8085925cSJames Wright
*8085925cSJames Wright  const NewtonianIdealGasContext newt_ctx = (NewtonianIdealGasContext) ctx;
*8085925cSJames Wright  const bool is_implicit  = newt_ctx->is_implicit;
*8085925cSJames Wright  const CeedScalar cv     = newt_ctx->cv;
*8085925cSJames Wright  const CeedScalar cp     = newt_ctx->cp;
*8085925cSJames Wright  const CeedScalar gamma  = cp/cv;
*8085925cSJames Wright
*8085925cSJames Wright  CeedPragmaSIMD
*8085925cSJames Wright  for(CeedInt i=0; i<Q; i++) {
*8085925cSJames Wright    const CeedScalar rho        = q[0][i];
*8085925cSJames Wright    const CeedScalar u[]        = {q[1][i]/rho, q[2][i]/rho, q[3][i]/rho};
*8085925cSJames Wright    const CeedScalar E_kinetic  = .5 * rho * (u[0]*u[0] + u[1]*u[1] + u[2]*u[2]);
*8085925cSJames Wright    const CeedScalar E_internal = q[4][i] - E_kinetic;
*8085925cSJames Wright    const CeedScalar P          = E_internal * (gamma - 1.);
*8085925cSJames Wright
*8085925cSJames Wright    const CeedScalar wdetJb  = (is_implicit ? -1. : 1.) * q_data_sur[0][i];
*8085925cSJames Wright    // ---- Normal vect
*8085925cSJames Wright    const CeedScalar norm[3] = {q_data_sur[1][i],
*8085925cSJames Wright                                q_data_sur[2][i],
*8085925cSJames Wright                                q_data_sur[3][i]
*8085925cSJames Wright                               };
*8085925cSJames Wright
*8085925cSJames Wright    const CeedScalar E = E_internal + E_kinetic;
*8085925cSJames Wright
*8085925cSJames Wright    // Velocity normal to the boundary
*8085925cSJames Wright    const CeedScalar u_normal = norm[0]*u[0] +
*8085925cSJames Wright                                norm[1]*u[1] +
*8085925cSJames Wright                                norm[2]*u[2];
*8085925cSJames Wright    // The Physics
*8085925cSJames Wright    // Zero v so all future terms can safely sum into it
*8085925cSJames Wright    for (CeedInt j=0; j<5; j++) v[j][i] = 0.;
*8085925cSJames Wright
*8085925cSJames Wright    // The Physics
*8085925cSJames Wright    // -- Density
*8085925cSJames Wright    v[0][i] -= wdetJb * rho * u_normal;
*8085925cSJames Wright
*8085925cSJames Wright    // -- Momentum
*8085925cSJames Wright    for (CeedInt j=0; j<3; j++)
*8085925cSJames Wright      v[j+1][i] -= wdetJb *(rho * u_normal * u[j] +
*8085925cSJames Wright                            norm[j] * P);
*8085925cSJames Wright
*8085925cSJames Wright    // -- Total Energy Density
*8085925cSJames Wright    v[4][i] -= wdetJb * u_normal * (E + P);
*8085925cSJames Wright  }
*8085925cSJames Wright  return 0;
*8085925cSJames Wright}
*8085925cSJames Wright
3a8779fbSJames Wright// *****************************************************************************
3a8779fbSJames Wright#endif // newtonian_h