1ae2b091fSJames Wright // SPDX-FileCopyrightText: Copyright (c) 2017-2024, HONEE contributors. 2ae2b091fSJames Wright // SPDX-License-Identifier: Apache-2.0 OR BSD-2-Clause 362b7942eSJames Wright 462b7942eSJames Wright /// @file 5952746efSJames Wright /// Structs and helper functions to evaluate data-driven subgrid-stress modeling 63fc405b4SJames Wright /// See 'Invariant data-driven subgrid stress modeling in the strain-rate eigenframe for large eddy simulation' 2022 and 'S-frame discrepancy 73fc405b4SJames Wright /// correction models for data-informed Reynolds stress closure' 2022 83e17a7a1SJames Wright #include <ceed/types.h> 962b7942eSJames Wright 103fc405b4SJames Wright #include "newtonian_state.h" 119c678832SJames Wright #include "newtonian_types.h" 12952746efSJames Wright #include "sgs_dd_utils.h" 133fc405b4SJames Wright #include "utils.h" 143fc405b4SJames Wright #include "utils_eigensolver_jacobi.h" 153fc405b4SJames Wright 16ad494f68SJames Wright typedef struct SgsDDContext_ *SgsDDContext; 17ad494f68SJames Wright struct SgsDDContext_ { 1862b7942eSJames Wright CeedInt num_inputs, num_outputs; 1962b7942eSJames Wright CeedInt num_layers; 2062b7942eSJames Wright CeedInt num_neurons; 2162b7942eSJames Wright CeedScalar alpha; 2262b7942eSJames Wright 23*cde3d787SJames Wright struct NewtonianIdealGasContext_ newt_ctx; 2462b7942eSJames Wright struct { 2562b7942eSJames Wright size_t bias1, bias2; 2662b7942eSJames Wright size_t weight1, weight2; 2762b7942eSJames Wright size_t out_scaling; 2862b7942eSJames Wright } offsets; 2962b7942eSJames Wright size_t total_bytes; 3062b7942eSJames Wright CeedScalar data[1]; 3162b7942eSJames Wright }; 3262b7942eSJames Wright 333fc405b4SJames Wright CEED_QFUNCTION_HELPER void LeakyReLU(CeedScalar *x, const CeedScalar alpha, const CeedInt N) { 343fc405b4SJames Wright for (CeedInt i = 0; i < N; i++) x[i] *= (x[i] < 0 ? alpha : 1.); 353fc405b4SJames Wright } 363fc405b4SJames Wright 37ad494f68SJames Wright CEED_QFUNCTION_HELPER void DataDrivenInference(const CeedScalar *inputs, CeedScalar *outputs, SgsDDContext sgsdd_ctx) { 383fc405b4SJames Wright const CeedInt num_neurons = sgsdd_ctx->num_neurons; 393fc405b4SJames Wright const CeedInt num_inputs = sgsdd_ctx->num_inputs; 403fc405b4SJames Wright const CeedInt num_outputs = sgsdd_ctx->num_outputs; 413fc405b4SJames Wright const CeedScalar alpha = sgsdd_ctx->alpha; 423fc405b4SJames Wright const CeedScalar *bias1 = &sgsdd_ctx->data[sgsdd_ctx->offsets.bias1]; 433fc405b4SJames Wright const CeedScalar *bias2 = &sgsdd_ctx->data[sgsdd_ctx->offsets.bias2]; 443fc405b4SJames Wright const CeedScalar *weight1 = &sgsdd_ctx->data[sgsdd_ctx->offsets.weight1]; 453fc405b4SJames Wright const CeedScalar *weight2 = &sgsdd_ctx->data[sgsdd_ctx->offsets.weight2]; 463fc405b4SJames Wright CeedScalar V[20] = {0.}; 473fc405b4SJames Wright 483fc405b4SJames Wright CopyN(bias1, V, num_neurons); 493fc405b4SJames Wright MatVecNM(weight1, inputs, num_neurons, num_inputs, CEED_NOTRANSPOSE, V); 503fc405b4SJames Wright LeakyReLU(V, alpha, num_neurons); 513fc405b4SJames Wright CopyN(bias2, outputs, num_outputs); 523fc405b4SJames Wright MatVecNM(weight2, V, num_outputs, num_neurons, CEED_NOTRANSPOSE, outputs); 533fc405b4SJames Wright } 543fc405b4SJames Wright 55ad494f68SJames Wright CEED_QFUNCTION_HELPER void ComputeSgsDD_Fused(const CeedScalar grad_velo_aniso[3][3], const CeedScalar km_A_ij[6], const CeedScalar delta, 56ad494f68SJames Wright const CeedScalar viscosity, CeedScalar kmsgs_stress[6], SgsDDContext sgsdd_ctx) { 57be75532aSJames Wright CeedScalar inputs[6], grad_velo_magnitude, eigenvectors[3][3], sgs_sframe_sym[6] = {0.}, new_bounds[6][2]; 58be75532aSJames Wright // Copying new_bounds because Sycl online compiler doesn't like direct casting the pointer 59be75532aSJames Wright CopyN(&sgsdd_ctx->data[sgsdd_ctx->offsets.out_scaling], (CeedScalar *)new_bounds, 12); 60db588195SJames Wright 61ad494f68SJames Wright ComputeSgsDDInputs(grad_velo_aniso, km_A_ij, delta, viscosity, eigenvectors, inputs, &grad_velo_magnitude); 623fc405b4SJames Wright DataDrivenInference(inputs, sgs_sframe_sym, sgsdd_ctx); 63ad494f68SJames Wright ComputeSgsDDOutputs(sgs_sframe_sym, delta, eigenvectors, new_bounds, grad_velo_magnitude, kmsgs_stress); 643fc405b4SJames Wright } 653fc405b4SJames Wright 66ee1455b7SJames Wright // @brief Calculate subgrid stress at nodes using anisotropic data-driven model 67ad494f68SJames Wright CEED_QFUNCTION_HELPER int ComputeSgsDDNodal_Fused(void *ctx, CeedInt Q, const CeedScalar *const *in, CeedScalar *const *out, 688fff8293SJames Wright StateVariable state_var) { 69ee1455b7SJames Wright const CeedScalar(*q)[CEED_Q_VLA] = (const CeedScalar(*)[CEED_Q_VLA])in[0]; 70ee1455b7SJames Wright const CeedScalar(*grad_velo)[3][CEED_Q_VLA] = (const CeedScalar(*)[3][CEED_Q_VLA])in[2]; 71ee1455b7SJames Wright const CeedScalar(*A_ij_delta)[CEED_Q_VLA] = (const CeedScalar(*)[CEED_Q_VLA])in[3]; 72ee1455b7SJames Wright const CeedScalar(*inv_multiplicity) = (const CeedScalar(*))in[4]; 73ee1455b7SJames Wright CeedScalar(*v)[CEED_Q_VLA] = (CeedScalar(*)[CEED_Q_VLA])out[0]; 74ee1455b7SJames Wright 75ad494f68SJames Wright const SgsDDContext sgsdd_ctx = (SgsDDContext)ctx; 76*cde3d787SJames Wright const NewtonianIGProperties gas = sgsdd_ctx->newt_ctx.gas; 77ee1455b7SJames Wright 78ee1455b7SJames Wright CeedPragmaSIMD for (CeedInt i = 0; i < Q; i++) { 79ee1455b7SJames Wright const CeedScalar qi[5] = {q[0][i], q[1][i], q[2][i], q[3][i], q[4][i]}; 80ee1455b7SJames Wright const CeedScalar grad_velo_aniso[3][3] = { 81ee1455b7SJames Wright {grad_velo[0][0][i], grad_velo[0][1][i], grad_velo[0][2][i]}, 82ee1455b7SJames Wright {grad_velo[1][0][i], grad_velo[1][1][i], grad_velo[1][2][i]}, 83ee1455b7SJames Wright {grad_velo[2][0][i], grad_velo[2][1][i], grad_velo[2][2][i]} 84ee1455b7SJames Wright }; 85ee1455b7SJames Wright const CeedScalar km_A_ij[6] = {A_ij_delta[0][i], A_ij_delta[1][i], A_ij_delta[2][i], A_ij_delta[3][i], A_ij_delta[4][i], A_ij_delta[5][i]}; 86ee1455b7SJames Wright const CeedScalar delta = A_ij_delta[6][i]; 87edcfef1bSKenneth E. Jansen const State s = StateFromQ(gas, qi, state_var); 88ee1455b7SJames Wright CeedScalar km_sgs[6]; 89ee1455b7SJames Wright 90*cde3d787SJames Wright ComputeSgsDD_Fused(grad_velo_aniso, km_A_ij, delta, gas.mu / s.U.density, km_sgs, sgsdd_ctx); 91ee1455b7SJames Wright 92ee1455b7SJames Wright for (int j = 0; j < 6; j++) v[j][i] = inv_multiplicity[i] * km_sgs[j]; 93ee1455b7SJames Wright } 94ee1455b7SJames Wright return 0; 95ee1455b7SJames Wright } 96ee1455b7SJames Wright 97ad494f68SJames Wright CEED_QFUNCTION(ComputeSgsDDNodal_Prim)(void *ctx, CeedInt Q, const CeedScalar *const *in, CeedScalar *const *out) { 98ad494f68SJames Wright return ComputeSgsDDNodal_Fused(ctx, Q, in, out, STATEVAR_PRIMITIVE); 99ee1455b7SJames Wright } 100ee1455b7SJames Wright 101ad494f68SJames Wright CEED_QFUNCTION(ComputeSgsDDNodal_Conserv)(void *ctx, CeedInt Q, const CeedScalar *const *in, CeedScalar *const *out) { 102ad494f68SJames Wright return ComputeSgsDDNodal_Fused(ctx, Q, in, out, STATEVAR_CONSERVATIVE); 103ee1455b7SJames Wright } 104ee1455b7SJames Wright 1059b103f75SJames Wright CEED_QFUNCTION(ComputeSgsDDNodal_Entropy)(void *ctx, CeedInt Q, const CeedScalar *const *in, CeedScalar *const *out) { 1069b103f75SJames Wright return ComputeSgsDDNodal_Fused(ctx, Q, in, out, STATEVAR_ENTROPY); 1079b103f75SJames Wright } 1089b103f75SJames Wright 1093ec34a3dSJames Wright // @brief Calculate inputs to anisotropic data-driven model 1103ec34a3dSJames Wright CEED_QFUNCTION_HELPER int ComputeSgsDDNodal_Sequential_Inputs(void *ctx, CeedInt Q, const CeedScalar *const *in, CeedScalar *const *out, 1113ec34a3dSJames Wright StateVariable state_var) { 1123ec34a3dSJames Wright const CeedScalar(*q)[CEED_Q_VLA] = (const CeedScalar(*)[CEED_Q_VLA])in[0]; 1133ec34a3dSJames Wright const CeedScalar(*grad_velo)[3][CEED_Q_VLA] = (const CeedScalar(*)[3][CEED_Q_VLA])in[1]; 1143ec34a3dSJames Wright const CeedScalar(*A_ij_delta)[CEED_Q_VLA] = (const CeedScalar(*)[CEED_Q_VLA])in[2]; 1153ec34a3dSJames Wright const CeedScalar(*inv_multiplicity) = (const CeedScalar(*))in[3]; 1163ec34a3dSJames Wright CeedScalar(*eigenvectors_stored) = out[0]; 1173ec34a3dSJames Wright CeedScalar(*model_inputs)[CEED_Q_VLA] = (CeedScalar(*)[CEED_Q_VLA])out[1]; 1183ec34a3dSJames Wright 119b87d60b3SJames Wright const SgsDDContext sgsdd_ctx = (SgsDDContext)ctx; 120*cde3d787SJames Wright const NewtonianIGProperties gas = sgsdd_ctx->newt_ctx.gas; 1213ec34a3dSJames Wright 1223ec34a3dSJames Wright CeedPragmaSIMD for (CeedInt i = 0; i < Q; i++) { 1233ec34a3dSJames Wright const CeedScalar qi[5] = {q[0][i], q[1][i], q[2][i], q[3][i], q[4][i]}; 1243ec34a3dSJames Wright const CeedScalar grad_velo_aniso[3][3] = { 1253ec34a3dSJames Wright {grad_velo[0][0][i], grad_velo[0][1][i], grad_velo[0][2][i]}, 1263ec34a3dSJames Wright {grad_velo[1][0][i], grad_velo[1][1][i], grad_velo[1][2][i]}, 1273ec34a3dSJames Wright {grad_velo[2][0][i], grad_velo[2][1][i], grad_velo[2][2][i]} 1283ec34a3dSJames Wright }; 1293ec34a3dSJames Wright const CeedScalar km_A_ij[6] = {A_ij_delta[0][i], A_ij_delta[1][i], A_ij_delta[2][i], A_ij_delta[3][i], A_ij_delta[4][i], A_ij_delta[5][i]}; 1303ec34a3dSJames Wright const CeedScalar delta = A_ij_delta[6][i]; 1313ec34a3dSJames Wright const State s = StateFromQ(gas, qi, state_var); 1323ec34a3dSJames Wright 1333ec34a3dSJames Wright CeedScalar model_inputs_i[6], grad_velo_magnitude, eigenvectors[3][3]; 134*cde3d787SJames Wright ComputeSgsDDInputs(grad_velo_aniso, km_A_ij, delta, gas.mu / s.U.density, eigenvectors, model_inputs_i, &grad_velo_magnitude); 1353ec34a3dSJames Wright 1363ec34a3dSJames Wright ScaleN(model_inputs_i, inv_multiplicity[i], 6); 1373ec34a3dSJames Wright StoredValuesPack(Q, i, 0, 6, model_inputs_i, (CeedScalar *)model_inputs); 1383ec34a3dSJames Wright StoredValuesPack(Q, i, 0, 9, (const CeedScalar *)eigenvectors, eigenvectors_stored); 139b87d60b3SJames Wright StoredValuesPack(Q, i, 9, 1, &grad_velo_magnitude, eigenvectors_stored); 1403ec34a3dSJames Wright } 1413ec34a3dSJames Wright return CEED_ERROR_SUCCESS; 1423ec34a3dSJames Wright } 1433ec34a3dSJames Wright 1443ec34a3dSJames Wright CEED_QFUNCTION(ComputeSgsDDNodal_Sequential_Inputs_Prim)(void *ctx, CeedInt Q, const CeedScalar *const *in, CeedScalar *const *out) { 1453ec34a3dSJames Wright return ComputeSgsDDNodal_Sequential_Inputs(ctx, Q, in, out, STATEVAR_PRIMITIVE); 1463ec34a3dSJames Wright } 1473ec34a3dSJames Wright 1483ec34a3dSJames Wright CEED_QFUNCTION(ComputeSgsDDNodal_Sequential_Inputs_Conserv)(void *ctx, CeedInt Q, const CeedScalar *const *in, CeedScalar *const *out) { 1493ec34a3dSJames Wright return ComputeSgsDDNodal_Sequential_Inputs(ctx, Q, in, out, STATEVAR_CONSERVATIVE); 1503ec34a3dSJames Wright } 1513ec34a3dSJames Wright 1529b103f75SJames Wright CEED_QFUNCTION(ComputeSgsDDNodal_Sequential_Inputs_Entropy)(void *ctx, CeedInt Q, const CeedScalar *const *in, CeedScalar *const *out) { 1539b103f75SJames Wright return ComputeSgsDDNodal_Sequential_Inputs(ctx, Q, in, out, STATEVAR_ENTROPY); 1549b103f75SJames Wright } 1559b103f75SJames Wright 156b87d60b3SJames Wright // @brief Runs inference on the data-driven model, used predominantsly for testing and validation 157b87d60b3SJames Wright CEED_QFUNCTION(ComputeSgsDDNodal_Sequential_Inference)(void *ctx, CeedInt Q, const CeedScalar *const *in, CeedScalar *const *out) { 158b87d60b3SJames Wright const CeedScalar(*model_inputs) = in[0]; 159b87d60b3SJames Wright const CeedScalar(*inv_multiplicity) = in[1]; 160b87d60b3SJames Wright CeedScalar(*model_outputs) = out[0]; 161b87d60b3SJames Wright 162b87d60b3SJames Wright const SgsDDContext sgsdd_ctx = (SgsDDContext)ctx; 163b87d60b3SJames Wright 164b87d60b3SJames Wright CeedPragmaSIMD for (CeedInt i = 0; i < Q; i++) { 165b87d60b3SJames Wright CeedScalar model_inputs_i[6], model_outputs_i[6]; 166b87d60b3SJames Wright 167b87d60b3SJames Wright StoredValuesUnpack(Q, i, 0, 6, (const CeedScalar *)model_inputs, model_inputs_i); 168b87d60b3SJames Wright DataDrivenInference(model_inputs_i, model_outputs_i, sgsdd_ctx); 169b87d60b3SJames Wright ScaleN(model_outputs_i, inv_multiplicity[i], 6); 170b87d60b3SJames Wright StoredValuesPack(Q, i, 0, 6, model_outputs_i, model_outputs); 171b87d60b3SJames Wright } 172b87d60b3SJames Wright return CEED_ERROR_SUCCESS; 173b87d60b3SJames Wright } 174b87d60b3SJames Wright 1753ec34a3dSJames Wright // @brief Calculates SGS from outputs of anisotropic data-driven model 176b87d60b3SJames Wright CEED_QFUNCTION(ComputeSgsDDNodal_Sequential_Outputs)(void *ctx, CeedInt Q, const CeedScalar *const *in, CeedScalar *const *out) { 177b87d60b3SJames Wright const CeedScalar(*model_outputs) = in[0]; 178b87d60b3SJames Wright const CeedScalar(*A_ij_delta)[CEED_Q_VLA] = (const CeedScalar(*)[CEED_Q_VLA])in[1]; 179b87d60b3SJames Wright const CeedScalar(*inv_multiplicity) = (const CeedScalar(*))in[2]; 180b87d60b3SJames Wright const CeedScalar(*eigenvectors_stored) = in[3]; 1813ec34a3dSJames Wright CeedScalar(*kmsgs_stress)[CEED_Q_VLA] = (CeedScalar(*)[CEED_Q_VLA])out[0]; 1823ec34a3dSJames Wright 183b87d60b3SJames Wright const SgsDDContext sgsdd_ctx = (SgsDDContext)ctx; 1843ec34a3dSJames Wright CeedScalar new_bounds[6][2]; 1853ec34a3dSJames Wright CopyN(&sgsdd_ctx->data[sgsdd_ctx->offsets.out_scaling], (CeedScalar *)new_bounds, 12); 1863ec34a3dSJames Wright 1873ec34a3dSJames Wright CeedPragmaSIMD for (CeedInt i = 0; i < Q; i++) { 188b87d60b3SJames Wright CeedScalar model_outputs_i[6]; 1893ec34a3dSJames Wright const CeedScalar delta = A_ij_delta[6][i]; 1903ec34a3dSJames Wright 1913ec34a3dSJames Wright StoredValuesUnpack(Q, i, 0, 6, model_outputs, model_outputs_i); 1923ec34a3dSJames Wright CeedScalar grad_velo_magnitude, eigenvectors[3][3], kmsgs_stress_i[6]; 1933ec34a3dSJames Wright StoredValuesUnpack(Q, i, 0, 9, eigenvectors_stored, (CeedScalar *)eigenvectors); 194b87d60b3SJames Wright StoredValuesUnpack(Q, i, 9, 1, eigenvectors_stored, &grad_velo_magnitude); 1953ec34a3dSJames Wright ComputeSgsDDOutputs(model_outputs_i, delta, eigenvectors, new_bounds, grad_velo_magnitude, kmsgs_stress_i); 1963ec34a3dSJames Wright 1973ec34a3dSJames Wright for (int j = 0; j < 6; j++) kmsgs_stress[j][i] = inv_multiplicity[i] * kmsgs_stress_i[j]; 1983ec34a3dSJames Wright } 1993ec34a3dSJames Wright return CEED_ERROR_SUCCESS; 2003ec34a3dSJames Wright } 2013ec34a3dSJames Wright 2029c678832SJames Wright // @brief Adds subgrid stress to residual (during IFunction evaluation) 2039c678832SJames Wright CEED_QFUNCTION_HELPER int FluxSubgridStress(const StatePrimitive Y, const CeedScalar km_sgs[6], CeedScalar Flux[5][3]) { 2049c678832SJames Wright CeedScalar sgs[3][3]; 2059c678832SJames Wright 2069c678832SJames Wright KMUnpack(km_sgs, sgs); 2079c678832SJames Wright for (CeedInt j = 0; j < 3; j++) { 2089c678832SJames Wright Flux[0][j] = 0.; 2099c678832SJames Wright for (CeedInt k = 0; k < 3; k++) Flux[k + 1][j] = sgs[k][j]; 2109c678832SJames Wright Flux[4][j] = Y.velocity[0] * sgs[0][j] + Y.velocity[1] * sgs[1][j] + Y.velocity[2] * sgs[2][j]; 2119c678832SJames Wright } 2129c678832SJames Wright return 0; 2139c678832SJames Wright } 2149c678832SJames Wright 21542454adaSJames Wright CEED_QFUNCTION_HELPER int IFunction_NodalSgs(void *ctx, CeedInt Q, const CeedScalar *const *in, CeedScalar *const *out, StateVariable state_var) { 2169c678832SJames Wright const CeedScalar(*q)[CEED_Q_VLA] = (const CeedScalar(*)[CEED_Q_VLA])in[0]; 217ade49511SJames Wright const CeedScalar(*q_data) = in[1]; 218e985bffbSJames Wright const CeedScalar(*km_sgs)[CEED_Q_VLA] = (const CeedScalar(*)[CEED_Q_VLA])in[2]; 2199c678832SJames Wright CeedScalar(*Grad_v)[5][CEED_Q_VLA] = (CeedScalar(*)[5][CEED_Q_VLA])out[0]; 2209c678832SJames Wright 221*cde3d787SJames Wright NewtonianIdealGasContext newt_ctx = (NewtonianIdealGasContext)ctx; 2229c678832SJames Wright 2239c678832SJames Wright CeedPragmaSIMD for (CeedInt i = 0; i < Q; i++) { 2249c678832SJames Wright const CeedScalar qi[5] = {q[0][i], q[1][i], q[2][i], q[3][i], q[4][i]}; 225*cde3d787SJames Wright const State s = StateFromQ(newt_ctx->gas, qi, state_var); 2269c678832SJames Wright 227ade49511SJames Wright CeedScalar wdetJ, dXdx[3][3]; 228ade49511SJames Wright QdataUnpack_3D(Q, i, q_data, &wdetJ, dXdx); 2299c678832SJames Wright 2309c678832SJames Wright CeedScalar Flux[5][3]; 2319c678832SJames Wright const CeedScalar km_sgs_i[6] = {km_sgs[0][i], km_sgs[1][i], km_sgs[2][i], km_sgs[3][i], km_sgs[4][i], km_sgs[5][i]}; 2329c678832SJames Wright FluxSubgridStress(s.Y, km_sgs_i, Flux); 2339c678832SJames Wright 2347523f6aaSJames Wright for (CeedInt k = 0; k < 3; k++) { 2357523f6aaSJames Wright for (CeedInt j = 0; j < 5; j++) { 2367523f6aaSJames Wright Grad_v[k][j][i] = -wdetJ * (dXdx[k][0] * Flux[j][0] + dXdx[k][1] * Flux[j][1] + dXdx[k][2] * Flux[j][2]); 2379c678832SJames Wright } 2389c678832SJames Wright } 2399c678832SJames Wright } 2409c678832SJames Wright return 0; 2419c678832SJames Wright } 2429c678832SJames Wright 24342454adaSJames Wright CEED_QFUNCTION(IFunction_NodalSgs_Conserv)(void *ctx, CeedInt Q, const CeedScalar *const *in, CeedScalar *const *out) { 24442454adaSJames Wright return IFunction_NodalSgs(ctx, Q, in, out, STATEVAR_CONSERVATIVE); 2459c678832SJames Wright } 2469c678832SJames Wright 24742454adaSJames Wright CEED_QFUNCTION(IFunction_NodalSgs_Prim)(void *ctx, CeedInt Q, const CeedScalar *const *in, CeedScalar *const *out) { 24842454adaSJames Wright return IFunction_NodalSgs(ctx, Q, in, out, STATEVAR_PRIMITIVE); 2499c678832SJames Wright } 2509b103f75SJames Wright 2519b103f75SJames Wright CEED_QFUNCTION(IFunction_NodalSgs_Entropy)(void *ctx, CeedInt Q, const CeedScalar *const *in, CeedScalar *const *out) { 2529b103f75SJames Wright return IFunction_NodalSgs(ctx, Q, in, out, STATEVAR_ENTROPY); 2539b103f75SJames Wright } 254