xref: /honee/qfunctions/sgs_dd_model.h (revision 4c07ec2294887c4a114ef13a7c2da0ab5f5dc208)
1dc936754SJeremy L Thompson // Copyright (c) 2017-2024, Lawrence Livermore National Security, LLC and other CEED contributors.
262b7942eSJames Wright // All Rights Reserved. See the top-level LICENSE and NOTICE files for details.
362b7942eSJames Wright //
462b7942eSJames Wright // SPDX-License-Identifier: BSD-2-Clause
562b7942eSJames Wright //
662b7942eSJames Wright // This file is part of CEED:  http://github.com/ceed
762b7942eSJames Wright 
862b7942eSJames Wright /// @file
9952746efSJames Wright /// Structs and helper functions to evaluate data-driven subgrid-stress modeling
103fc405b4SJames Wright /// See 'Invariant data-driven subgrid stress modeling in the strain-rate eigenframe for large eddy simulation' 2022 and 'S-frame discrepancy
113fc405b4SJames Wright /// correction models for data-informed Reynolds stress closure' 2022
1262b7942eSJames Wright #include <ceed.h>
1362b7942eSJames Wright 
143fc405b4SJames Wright #include "newtonian_state.h"
159c678832SJames Wright #include "newtonian_types.h"
16952746efSJames Wright #include "sgs_dd_utils.h"
173fc405b4SJames Wright #include "utils.h"
183fc405b4SJames Wright #include "utils_eigensolver_jacobi.h"
193fc405b4SJames Wright 
20ad494f68SJames Wright typedef struct SgsDDContext_ *SgsDDContext;
21ad494f68SJames Wright struct SgsDDContext_ {
2262b7942eSJames Wright   CeedInt    num_inputs, num_outputs;
2362b7942eSJames Wright   CeedInt    num_layers;
2462b7942eSJames Wright   CeedInt    num_neurons;
2562b7942eSJames Wright   CeedScalar alpha;
2662b7942eSJames Wright 
27ee1455b7SJames Wright   struct NewtonianIdealGasContext_ gas;
2862b7942eSJames Wright   struct {
2962b7942eSJames Wright     size_t bias1, bias2;
3062b7942eSJames Wright     size_t weight1, weight2;
3162b7942eSJames Wright     size_t out_scaling;
3262b7942eSJames Wright   } offsets;
3362b7942eSJames Wright   size_t     total_bytes;
3462b7942eSJames Wright   CeedScalar data[1];
3562b7942eSJames Wright };
3662b7942eSJames Wright 
373fc405b4SJames Wright CEED_QFUNCTION_HELPER void LeakyReLU(CeedScalar *x, const CeedScalar alpha, const CeedInt N) {
383fc405b4SJames Wright   for (CeedInt i = 0; i < N; i++) x[i] *= (x[i] < 0 ? alpha : 1.);
393fc405b4SJames Wright }
403fc405b4SJames Wright 
41ad494f68SJames Wright CEED_QFUNCTION_HELPER void DataDrivenInference(const CeedScalar *inputs, CeedScalar *outputs, SgsDDContext sgsdd_ctx) {
423fc405b4SJames Wright   const CeedInt     num_neurons = sgsdd_ctx->num_neurons;
433fc405b4SJames Wright   const CeedInt     num_inputs  = sgsdd_ctx->num_inputs;
443fc405b4SJames Wright   const CeedInt     num_outputs = sgsdd_ctx->num_outputs;
453fc405b4SJames Wright   const CeedScalar  alpha       = sgsdd_ctx->alpha;
463fc405b4SJames Wright   const CeedScalar *bias1       = &sgsdd_ctx->data[sgsdd_ctx->offsets.bias1];
473fc405b4SJames Wright   const CeedScalar *bias2       = &sgsdd_ctx->data[sgsdd_ctx->offsets.bias2];
483fc405b4SJames Wright   const CeedScalar *weight1     = &sgsdd_ctx->data[sgsdd_ctx->offsets.weight1];
493fc405b4SJames Wright   const CeedScalar *weight2     = &sgsdd_ctx->data[sgsdd_ctx->offsets.weight2];
503fc405b4SJames Wright   CeedScalar        V[20]       = {0.};
513fc405b4SJames Wright 
523fc405b4SJames Wright   CopyN(bias1, V, num_neurons);
533fc405b4SJames Wright   MatVecNM(weight1, inputs, num_neurons, num_inputs, CEED_NOTRANSPOSE, V);
543fc405b4SJames Wright   LeakyReLU(V, alpha, num_neurons);
553fc405b4SJames Wright   CopyN(bias2, outputs, num_outputs);
563fc405b4SJames Wright   MatVecNM(weight2, V, num_outputs, num_neurons, CEED_NOTRANSPOSE, outputs);
573fc405b4SJames Wright }
583fc405b4SJames Wright 
59ad494f68SJames Wright CEED_QFUNCTION_HELPER void ComputeSgsDD_Fused(const CeedScalar grad_velo_aniso[3][3], const CeedScalar km_A_ij[6], const CeedScalar delta,
60ad494f68SJames Wright                                               const CeedScalar viscosity, CeedScalar kmsgs_stress[6], SgsDDContext sgsdd_ctx) {
61be75532aSJames Wright   CeedScalar inputs[6], grad_velo_magnitude, eigenvectors[3][3], sgs_sframe_sym[6] = {0.}, new_bounds[6][2];
62be75532aSJames Wright   // Copying new_bounds because Sycl online compiler doesn't like direct casting the pointer
63be75532aSJames Wright   CopyN(&sgsdd_ctx->data[sgsdd_ctx->offsets.out_scaling], (CeedScalar *)new_bounds, 12);
64db588195SJames Wright 
65ad494f68SJames Wright   ComputeSgsDDInputs(grad_velo_aniso, km_A_ij, delta, viscosity, eigenvectors, inputs, &grad_velo_magnitude);
663fc405b4SJames Wright   DataDrivenInference(inputs, sgs_sframe_sym, sgsdd_ctx);
67ad494f68SJames Wright   ComputeSgsDDOutputs(sgs_sframe_sym, delta, eigenvectors, new_bounds, grad_velo_magnitude, kmsgs_stress);
683fc405b4SJames Wright }
693fc405b4SJames Wright 
70ee1455b7SJames Wright // @brief Calculate subgrid stress at nodes using anisotropic data-driven model
71ad494f68SJames Wright CEED_QFUNCTION_HELPER int ComputeSgsDDNodal_Fused(void *ctx, CeedInt Q, const CeedScalar *const *in, CeedScalar *const *out,
728fff8293SJames Wright                                                   StateVariable state_var) {
73ee1455b7SJames Wright   const CeedScalar(*q)[CEED_Q_VLA]            = (const CeedScalar(*)[CEED_Q_VLA])in[0];
74ee1455b7SJames Wright   const CeedScalar(*grad_velo)[3][CEED_Q_VLA] = (const CeedScalar(*)[3][CEED_Q_VLA])in[2];
75ee1455b7SJames Wright   const CeedScalar(*A_ij_delta)[CEED_Q_VLA]   = (const CeedScalar(*)[CEED_Q_VLA])in[3];
76ee1455b7SJames Wright   const CeedScalar(*inv_multiplicity)         = (const CeedScalar(*))in[4];
77ee1455b7SJames Wright   CeedScalar(*v)[CEED_Q_VLA]                  = (CeedScalar(*)[CEED_Q_VLA])out[0];
78ee1455b7SJames Wright 
79ad494f68SJames Wright   const SgsDDContext             sgsdd_ctx = (SgsDDContext)ctx;
80ee1455b7SJames Wright   const NewtonianIdealGasContext gas       = &sgsdd_ctx->gas;
81ee1455b7SJames Wright 
82ee1455b7SJames Wright   CeedPragmaSIMD for (CeedInt i = 0; i < Q; i++) {
83ee1455b7SJames Wright     const CeedScalar qi[5]                 = {q[0][i], q[1][i], q[2][i], q[3][i], q[4][i]};
84ee1455b7SJames Wright     const CeedScalar grad_velo_aniso[3][3] = {
85ee1455b7SJames Wright         {grad_velo[0][0][i], grad_velo[0][1][i], grad_velo[0][2][i]},
86ee1455b7SJames Wright         {grad_velo[1][0][i], grad_velo[1][1][i], grad_velo[1][2][i]},
87ee1455b7SJames Wright         {grad_velo[2][0][i], grad_velo[2][1][i], grad_velo[2][2][i]}
88ee1455b7SJames Wright     };
89ee1455b7SJames Wright     const CeedScalar km_A_ij[6] = {A_ij_delta[0][i], A_ij_delta[1][i], A_ij_delta[2][i], A_ij_delta[3][i], A_ij_delta[4][i], A_ij_delta[5][i]};
90ee1455b7SJames Wright     const CeedScalar delta      = A_ij_delta[6][i];
91edcfef1bSKenneth E. Jansen     const State      s          = StateFromQ(gas, qi, state_var);
92ee1455b7SJames Wright     CeedScalar       km_sgs[6];
93ee1455b7SJames Wright 
94ad494f68SJames Wright     ComputeSgsDD_Fused(grad_velo_aniso, km_A_ij, delta, gas->mu / s.U.density, km_sgs, sgsdd_ctx);
95ee1455b7SJames Wright 
96ee1455b7SJames Wright     for (int j = 0; j < 6; j++) v[j][i] = inv_multiplicity[i] * km_sgs[j];
97ee1455b7SJames Wright   }
98ee1455b7SJames Wright   return 0;
99ee1455b7SJames Wright }
100ee1455b7SJames Wright 
101ad494f68SJames Wright CEED_QFUNCTION(ComputeSgsDDNodal_Prim)(void *ctx, CeedInt Q, const CeedScalar *const *in, CeedScalar *const *out) {
102ad494f68SJames Wright   return ComputeSgsDDNodal_Fused(ctx, Q, in, out, STATEVAR_PRIMITIVE);
103ee1455b7SJames Wright }
104ee1455b7SJames Wright 
105ad494f68SJames Wright CEED_QFUNCTION(ComputeSgsDDNodal_Conserv)(void *ctx, CeedInt Q, const CeedScalar *const *in, CeedScalar *const *out) {
106ad494f68SJames Wright   return ComputeSgsDDNodal_Fused(ctx, Q, in, out, STATEVAR_CONSERVATIVE);
107ee1455b7SJames Wright }
108ee1455b7SJames Wright 
1093ec34a3dSJames Wright // @brief Calculate inputs to anisotropic data-driven model
1103ec34a3dSJames Wright CEED_QFUNCTION_HELPER int ComputeSgsDDNodal_Sequential_Inputs(void *ctx, CeedInt Q, const CeedScalar *const *in, CeedScalar *const *out,
1113ec34a3dSJames Wright                                                               StateVariable state_var) {
1123ec34a3dSJames Wright   const CeedScalar(*q)[CEED_Q_VLA]            = (const CeedScalar(*)[CEED_Q_VLA])in[0];
1133ec34a3dSJames Wright   const CeedScalar(*grad_velo)[3][CEED_Q_VLA] = (const CeedScalar(*)[3][CEED_Q_VLA])in[1];
1143ec34a3dSJames Wright   const CeedScalar(*A_ij_delta)[CEED_Q_VLA]   = (const CeedScalar(*)[CEED_Q_VLA])in[2];
1153ec34a3dSJames Wright   const CeedScalar(*inv_multiplicity)         = (const CeedScalar(*))in[3];
1163ec34a3dSJames Wright   CeedScalar(*eigenvectors_stored)            = out[0];
1173ec34a3dSJames Wright   CeedScalar(*model_inputs)[CEED_Q_VLA]       = (CeedScalar(*)[CEED_Q_VLA])out[1];
1183ec34a3dSJames Wright 
119b87d60b3SJames Wright   const SgsDDContext             sgsdd_ctx = (SgsDDContext)ctx;
1203ec34a3dSJames Wright   const NewtonianIdealGasContext gas       = &sgsdd_ctx->gas;
1213ec34a3dSJames Wright 
1223ec34a3dSJames Wright   CeedPragmaSIMD for (CeedInt i = 0; i < Q; i++) {
1233ec34a3dSJames Wright     const CeedScalar qi[5]                 = {q[0][i], q[1][i], q[2][i], q[3][i], q[4][i]};
1243ec34a3dSJames Wright     const CeedScalar grad_velo_aniso[3][3] = {
1253ec34a3dSJames Wright         {grad_velo[0][0][i], grad_velo[0][1][i], grad_velo[0][2][i]},
1263ec34a3dSJames Wright         {grad_velo[1][0][i], grad_velo[1][1][i], grad_velo[1][2][i]},
1273ec34a3dSJames Wright         {grad_velo[2][0][i], grad_velo[2][1][i], grad_velo[2][2][i]}
1283ec34a3dSJames Wright     };
1293ec34a3dSJames Wright     const CeedScalar km_A_ij[6] = {A_ij_delta[0][i], A_ij_delta[1][i], A_ij_delta[2][i], A_ij_delta[3][i], A_ij_delta[4][i], A_ij_delta[5][i]};
1303ec34a3dSJames Wright     const CeedScalar delta      = A_ij_delta[6][i];
1313ec34a3dSJames Wright     const State      s          = StateFromQ(gas, qi, state_var);
1323ec34a3dSJames Wright 
1333ec34a3dSJames Wright     CeedScalar model_inputs_i[6], grad_velo_magnitude, eigenvectors[3][3];
1343ec34a3dSJames Wright     ComputeSgsDDInputs(grad_velo_aniso, km_A_ij, delta, gas->mu / s.U.density, eigenvectors, model_inputs_i, &grad_velo_magnitude);
1353ec34a3dSJames Wright 
1363ec34a3dSJames Wright     ScaleN(model_inputs_i, inv_multiplicity[i], 6);
1373ec34a3dSJames Wright     StoredValuesPack(Q, i, 0, 6, model_inputs_i, (CeedScalar *)model_inputs);
1383ec34a3dSJames Wright     StoredValuesPack(Q, i, 0, 9, (const CeedScalar *)eigenvectors, eigenvectors_stored);
139b87d60b3SJames Wright     StoredValuesPack(Q, i, 9, 1, &grad_velo_magnitude, eigenvectors_stored);
1403ec34a3dSJames Wright   }
1413ec34a3dSJames Wright   return CEED_ERROR_SUCCESS;
1423ec34a3dSJames Wright }
1433ec34a3dSJames Wright 
1443ec34a3dSJames Wright CEED_QFUNCTION(ComputeSgsDDNodal_Sequential_Inputs_Prim)(void *ctx, CeedInt Q, const CeedScalar *const *in, CeedScalar *const *out) {
1453ec34a3dSJames Wright   return ComputeSgsDDNodal_Sequential_Inputs(ctx, Q, in, out, STATEVAR_PRIMITIVE);
1463ec34a3dSJames Wright }
1473ec34a3dSJames Wright 
1483ec34a3dSJames Wright CEED_QFUNCTION(ComputeSgsDDNodal_Sequential_Inputs_Conserv)(void *ctx, CeedInt Q, const CeedScalar *const *in, CeedScalar *const *out) {
1493ec34a3dSJames Wright   return ComputeSgsDDNodal_Sequential_Inputs(ctx, Q, in, out, STATEVAR_CONSERVATIVE);
1503ec34a3dSJames Wright }
1513ec34a3dSJames Wright 
152b87d60b3SJames Wright // @brief Runs inference on the data-driven model, used predominantsly for testing and validation
153b87d60b3SJames Wright CEED_QFUNCTION(ComputeSgsDDNodal_Sequential_Inference)(void *ctx, CeedInt Q, const CeedScalar *const *in, CeedScalar *const *out) {
154b87d60b3SJames Wright   const CeedScalar(*model_inputs)     = in[0];
155b87d60b3SJames Wright   const CeedScalar(*inv_multiplicity) = in[1];
156b87d60b3SJames Wright   CeedScalar(*model_outputs)          = out[0];
157b87d60b3SJames Wright 
158b87d60b3SJames Wright   const SgsDDContext sgsdd_ctx = (SgsDDContext)ctx;
159b87d60b3SJames Wright 
160b87d60b3SJames Wright   CeedPragmaSIMD for (CeedInt i = 0; i < Q; i++) {
161b87d60b3SJames Wright     CeedScalar model_inputs_i[6], model_outputs_i[6];
162*4c07ec22SJames Wright     // CeedScalar model_outputs_i[6];
163*4c07ec22SJames Wright     // CeedScalar model_inputs_i[6] = {1, 2, 3, 4, 5, 6};
164b87d60b3SJames Wright 
165b87d60b3SJames Wright     StoredValuesUnpack(Q, i, 0, 6, (const CeedScalar *)model_inputs, model_inputs_i);
166b87d60b3SJames Wright     DataDrivenInference(model_inputs_i, model_outputs_i, sgsdd_ctx);
167b87d60b3SJames Wright     ScaleN(model_outputs_i, inv_multiplicity[i], 6);
168b87d60b3SJames Wright     StoredValuesPack(Q, i, 0, 6, model_outputs_i, model_outputs);
169b87d60b3SJames Wright   }
170b87d60b3SJames Wright   return CEED_ERROR_SUCCESS;
171b87d60b3SJames Wright }
172b87d60b3SJames Wright 
1733ec34a3dSJames Wright // @brief Calculates SGS from outputs of anisotropic data-driven model
174b87d60b3SJames Wright CEED_QFUNCTION(ComputeSgsDDNodal_Sequential_Outputs)(void *ctx, CeedInt Q, const CeedScalar *const *in, CeedScalar *const *out) {
175b87d60b3SJames Wright   const CeedScalar(*model_outputs)          = in[0];
176b87d60b3SJames Wright   const CeedScalar(*A_ij_delta)[CEED_Q_VLA] = (const CeedScalar(*)[CEED_Q_VLA])in[1];
177b87d60b3SJames Wright   const CeedScalar(*inv_multiplicity)       = (const CeedScalar(*))in[2];
178b87d60b3SJames Wright   const CeedScalar(*eigenvectors_stored)    = in[3];
1793ec34a3dSJames Wright   CeedScalar(*kmsgs_stress)[CEED_Q_VLA]     = (CeedScalar(*)[CEED_Q_VLA])out[0];
1803ec34a3dSJames Wright 
181b87d60b3SJames Wright   const SgsDDContext sgsdd_ctx = (SgsDDContext)ctx;
1823ec34a3dSJames Wright   CeedScalar         new_bounds[6][2];
1833ec34a3dSJames Wright   CopyN(&sgsdd_ctx->data[sgsdd_ctx->offsets.out_scaling], (CeedScalar *)new_bounds, 12);
1843ec34a3dSJames Wright 
1853ec34a3dSJames Wright   CeedPragmaSIMD for (CeedInt i = 0; i < Q; i++) {
186b87d60b3SJames Wright     CeedScalar       model_outputs_i[6];
1873ec34a3dSJames Wright     const CeedScalar delta = A_ij_delta[6][i];
1883ec34a3dSJames Wright 
1893ec34a3dSJames Wright     StoredValuesUnpack(Q, i, 0, 6, model_outputs, model_outputs_i);
1903ec34a3dSJames Wright     CeedScalar grad_velo_magnitude, eigenvectors[3][3], kmsgs_stress_i[6];
1913ec34a3dSJames Wright     StoredValuesUnpack(Q, i, 0, 9, eigenvectors_stored, (CeedScalar *)eigenvectors);
192b87d60b3SJames Wright     StoredValuesUnpack(Q, i, 9, 1, eigenvectors_stored, &grad_velo_magnitude);
1933ec34a3dSJames Wright     ComputeSgsDDOutputs(model_outputs_i, delta, eigenvectors, new_bounds, grad_velo_magnitude, kmsgs_stress_i);
1943ec34a3dSJames Wright 
1953ec34a3dSJames Wright     for (int j = 0; j < 6; j++) kmsgs_stress[j][i] = inv_multiplicity[i] * kmsgs_stress_i[j];
1963ec34a3dSJames Wright   }
1973ec34a3dSJames Wright   return CEED_ERROR_SUCCESS;
1983ec34a3dSJames Wright }
1993ec34a3dSJames Wright 
2009c678832SJames Wright // @brief Adds subgrid stress to residual (during IFunction evaluation)
2019c678832SJames Wright CEED_QFUNCTION_HELPER int FluxSubgridStress(const StatePrimitive Y, const CeedScalar km_sgs[6], CeedScalar Flux[5][3]) {
2029c678832SJames Wright   CeedScalar sgs[3][3];
2039c678832SJames Wright 
2049c678832SJames Wright   KMUnpack(km_sgs, sgs);
2059c678832SJames Wright   for (CeedInt j = 0; j < 3; j++) {
2069c678832SJames Wright     Flux[0][j] = 0.;
2079c678832SJames Wright     for (CeedInt k = 0; k < 3; k++) Flux[k + 1][j] = sgs[k][j];
2089c678832SJames Wright     Flux[4][j] = Y.velocity[0] * sgs[0][j] + Y.velocity[1] * sgs[1][j] + Y.velocity[2] * sgs[2][j];
2099c678832SJames Wright   }
2109c678832SJames Wright   return 0;
2119c678832SJames Wright }
2129c678832SJames Wright 
21342454adaSJames Wright CEED_QFUNCTION_HELPER int IFunction_NodalSgs(void *ctx, CeedInt Q, const CeedScalar *const *in, CeedScalar *const *out, StateVariable state_var) {
2149c678832SJames Wright   const CeedScalar(*q)[CEED_Q_VLA]      = (const CeedScalar(*)[CEED_Q_VLA])in[0];
215ade49511SJames Wright   const CeedScalar(*q_data)             = in[1];
216e985bffbSJames Wright   const CeedScalar(*km_sgs)[CEED_Q_VLA] = (const CeedScalar(*)[CEED_Q_VLA])in[2];
2179c678832SJames Wright   CeedScalar(*Grad_v)[5][CEED_Q_VLA]    = (CeedScalar(*)[5][CEED_Q_VLA])out[0];
2189c678832SJames Wright 
21940816385SJames Wright   NewtonianIdealGasContext gas = (NewtonianIdealGasContext)ctx;
2209c678832SJames Wright 
2219c678832SJames Wright   CeedPragmaSIMD for (CeedInt i = 0; i < Q; i++) {
2229c678832SJames Wright     const CeedScalar qi[5] = {q[0][i], q[1][i], q[2][i], q[3][i], q[4][i]};
223edcfef1bSKenneth E. Jansen     const State      s     = StateFromQ(gas, qi, state_var);
2249c678832SJames Wright 
225ade49511SJames Wright     CeedScalar wdetJ, dXdx[3][3];
226ade49511SJames Wright     QdataUnpack_3D(Q, i, q_data, &wdetJ, dXdx);
2279c678832SJames Wright 
2289c678832SJames Wright     CeedScalar       Flux[5][3];
2299c678832SJames Wright     const CeedScalar km_sgs_i[6] = {km_sgs[0][i], km_sgs[1][i], km_sgs[2][i], km_sgs[3][i], km_sgs[4][i], km_sgs[5][i]};
2309c678832SJames Wright     FluxSubgridStress(s.Y, km_sgs_i, Flux);
2319c678832SJames Wright 
2327523f6aaSJames Wright     for (CeedInt k = 0; k < 3; k++) {
2337523f6aaSJames Wright       for (CeedInt j = 0; j < 5; j++) {
2347523f6aaSJames Wright         Grad_v[k][j][i] = -wdetJ * (dXdx[k][0] * Flux[j][0] + dXdx[k][1] * Flux[j][1] + dXdx[k][2] * Flux[j][2]);
2359c678832SJames Wright       }
2369c678832SJames Wright     }
2379c678832SJames Wright   }
2389c678832SJames Wright   return 0;
2399c678832SJames Wright }
2409c678832SJames Wright 
24142454adaSJames Wright CEED_QFUNCTION(IFunction_NodalSgs_Conserv)(void *ctx, CeedInt Q, const CeedScalar *const *in, CeedScalar *const *out) {
24242454adaSJames Wright   return IFunction_NodalSgs(ctx, Q, in, out, STATEVAR_CONSERVATIVE);
2439c678832SJames Wright }
2449c678832SJames Wright 
24542454adaSJames Wright CEED_QFUNCTION(IFunction_NodalSgs_Prim)(void *ctx, CeedInt Q, const CeedScalar *const *in, CeedScalar *const *out) {
24642454adaSJames Wright   return IFunction_NodalSgs(ctx, Q, in, out, STATEVAR_PRIMITIVE);
2479c678832SJames Wright }
248