162b7942eSJames Wright // Copyright (c) 2017-2023, Lawrence Livermore National Security, LLC and other CEED contributors. 262b7942eSJames Wright // All Rights Reserved. See the top-level LICENSE and NOTICE files for details. 362b7942eSJames Wright // 462b7942eSJames Wright // SPDX-License-Identifier: BSD-2-Clause 562b7942eSJames Wright // 662b7942eSJames Wright // This file is part of CEED: http://github.com/ceed 762b7942eSJames Wright 862b7942eSJames Wright /// @file 962b7942eSJames Wright /// Structs and helper functions for data-driven subgrid-stress modeling 103fc405b4SJames Wright /// See 'Invariant data-driven subgrid stress modeling in the strain-rate eigenframe for large eddy simulation' 2022 and 'S-frame discrepancy 113fc405b4SJames Wright /// correction models for data-informed Reynolds stress closure' 2022 1262b7942eSJames Wright 1362b7942eSJames Wright #ifndef sgs_dd_model_h 1462b7942eSJames Wright #define sgs_dd_model_h 1562b7942eSJames Wright 1662b7942eSJames Wright #include <ceed.h> 1762b7942eSJames Wright 18*ee1455b7SJames Wright #include "newtonian_types.h" 193fc405b4SJames Wright #include "newtonian_state.h" 203fc405b4SJames Wright #include "utils.h" 213fc405b4SJames Wright #include "utils_eigensolver_jacobi.h" 223fc405b4SJames Wright 2362b7942eSJames Wright typedef struct SGS_DD_ModelContext_ *SGS_DDModelContext; 2462b7942eSJames Wright struct SGS_DD_ModelContext_ { 2562b7942eSJames Wright CeedInt num_inputs, num_outputs; 2662b7942eSJames Wright CeedInt num_layers; 2762b7942eSJames Wright CeedInt num_neurons; 2862b7942eSJames Wright CeedScalar alpha; 2962b7942eSJames Wright 30*ee1455b7SJames Wright struct NewtonianIdealGasContext_ gas; 3162b7942eSJames Wright struct { 3262b7942eSJames Wright size_t bias1, bias2; 3362b7942eSJames Wright size_t weight1, weight2; 3462b7942eSJames Wright size_t out_scaling; 3562b7942eSJames Wright } offsets; 3662b7942eSJames Wright size_t total_bytes; 3762b7942eSJames Wright CeedScalar data[1]; 3862b7942eSJames Wright }; 3962b7942eSJames Wright 403fc405b4SJames Wright // @brief Calculate the inverse of the multiplicity, reducing to a single component 413fc405b4SJames Wright CEED_QFUNCTION(InverseMultiplicity)(void *ctx, CeedInt Q, const CeedScalar *const *in, CeedScalar *const *out) { 423fc405b4SJames Wright const CeedScalar(*multiplicity)[CEED_Q_VLA] = (const CeedScalar(*)[CEED_Q_VLA])in[0]; 433fc405b4SJames Wright CeedScalar(*inv_multiplicity) = (CeedScalar(*))out[0]; 443fc405b4SJames Wright 453fc405b4SJames Wright CeedPragmaSIMD for (CeedInt i = 0; i < Q; i++) inv_multiplicity[i] = 1.0 / multiplicity[0][i]; 463fc405b4SJames Wright return 0; 473fc405b4SJames Wright } 483fc405b4SJames Wright 493fc405b4SJames Wright // @brief Calculate Frobenius norm of velocity gradient from eigenframe quantities 503fc405b4SJames Wright CEED_QFUNCTION_HELPER CeedScalar VelocityGradientMagnitude(const CeedScalar strain_sframe[3], const CeedScalar vorticity_sframe[3]) { 513fc405b4SJames Wright return sqrt(Dot3(strain_sframe, strain_sframe) + 0.5 * Dot3(vorticity_sframe, vorticity_sframe)); 523fc405b4SJames Wright }; 533fc405b4SJames Wright 543fc405b4SJames Wright // @brief Denormalize outputs using min-max (de-)normalization 553fc405b4SJames Wright CEED_QFUNCTION_HELPER void DenormalizeDDOutputs(CeedScalar output[6], const CeedScalar new_bounds[6][2], const CeedScalar old_bounds[6][2]) { 563fc405b4SJames Wright CeedScalar bounds_ratio; 573fc405b4SJames Wright for (int i = 0; i < 6; i++) { 583fc405b4SJames Wright bounds_ratio = (new_bounds[i][1] - new_bounds[i][0]) / (old_bounds[i][1] - old_bounds[i][0]); 593fc405b4SJames Wright output[i] = bounds_ratio * (output[i] - old_bounds[i][1]) + new_bounds[i][1]; 603fc405b4SJames Wright } 613fc405b4SJames Wright } 623fc405b4SJames Wright 633fc405b4SJames Wright // @brief Change the order of basis vectors so that they align with vector and obey right-hand rule 643fc405b4SJames Wright // @details The e_1 and e_3 basis vectors are the closest aligned to the vector. The e_2 is set via e_3 x e_1 653fc405b4SJames Wright // The basis vectors are assumed to form the rows of the basis matrix. 663fc405b4SJames Wright CEED_QFUNCTION_HELPER void OrientBasisWithVector(CeedScalar basis[3][3], const CeedScalar vector[3]) { 673fc405b4SJames Wright CeedScalar alignment[3] = {0.}, cross[3]; 683fc405b4SJames Wright 693fc405b4SJames Wright MatVec3(basis, vector, CEED_NOTRANSPOSE, alignment); 703fc405b4SJames Wright 713fc405b4SJames Wright if (alignment[0] < 0) ScaleN(basis[0], -1, 3); 723fc405b4SJames Wright if (alignment[2] < 0) ScaleN(basis[2], -1, 3); 733fc405b4SJames Wright 743fc405b4SJames Wright Cross3(basis[2], basis[0], cross); 753fc405b4SJames Wright CeedScalar basis_1_orientation = Dot3(cross, basis[1]); 763fc405b4SJames Wright if (basis_1_orientation < 0) ScaleN(basis[1], -1, 3); 773fc405b4SJames Wright } 783fc405b4SJames Wright 793fc405b4SJames Wright CEED_QFUNCTION_HELPER void LeakyReLU(CeedScalar *x, const CeedScalar alpha, const CeedInt N) { 803fc405b4SJames Wright for (CeedInt i = 0; i < N; i++) x[i] *= (x[i] < 0 ? alpha : 1.); 813fc405b4SJames Wright } 823fc405b4SJames Wright 833fc405b4SJames Wright CEED_QFUNCTION_HELPER void DataDrivenInference(const CeedScalar *inputs, CeedScalar *outputs, SGS_DDModelContext sgsdd_ctx) { 843fc405b4SJames Wright const CeedInt num_neurons = sgsdd_ctx->num_neurons; 853fc405b4SJames Wright const CeedInt num_inputs = sgsdd_ctx->num_inputs; 863fc405b4SJames Wright const CeedInt num_outputs = sgsdd_ctx->num_outputs; 873fc405b4SJames Wright const CeedScalar alpha = sgsdd_ctx->alpha; 883fc405b4SJames Wright const CeedScalar *bias1 = &sgsdd_ctx->data[sgsdd_ctx->offsets.bias1]; 893fc405b4SJames Wright const CeedScalar *bias2 = &sgsdd_ctx->data[sgsdd_ctx->offsets.bias2]; 903fc405b4SJames Wright const CeedScalar *weight1 = &sgsdd_ctx->data[sgsdd_ctx->offsets.weight1]; 913fc405b4SJames Wright const CeedScalar *weight2 = &sgsdd_ctx->data[sgsdd_ctx->offsets.weight2]; 923fc405b4SJames Wright CeedScalar V[20] = {0.}; 933fc405b4SJames Wright 943fc405b4SJames Wright CopyN(bias1, V, num_neurons); 953fc405b4SJames Wright MatVecNM(weight1, inputs, num_neurons, num_inputs, CEED_NOTRANSPOSE, V); 963fc405b4SJames Wright LeakyReLU(V, alpha, num_neurons); 973fc405b4SJames Wright CopyN(bias2, outputs, num_outputs); 983fc405b4SJames Wright MatVecNM(weight2, V, num_outputs, num_neurons, CEED_NOTRANSPOSE, outputs); 993fc405b4SJames Wright } 1003fc405b4SJames Wright 1013fc405b4SJames Wright CEED_QFUNCTION_HELPER void ComputeSGS_DDAnisotropic(const CeedScalar grad_velo_aniso[3][3], const CeedScalar km_A_ij[6], const CeedScalar delta, 1023fc405b4SJames Wright const CeedScalar viscosity, CeedScalar kmsgs_stress[6], SGS_DDModelContext sgsdd_ctx) { 1033fc405b4SJames Wright CeedScalar strain_sframe[3] = {0.}, vorticity_sframe[3] = {0.}, eigenvectors[3][3]; 1043fc405b4SJames Wright CeedScalar A_ij[3][3] = {{0.}}, grad_velo_iso[3][3] = {{0.}}; 1053fc405b4SJames Wright 1063fc405b4SJames Wright // -- Unpack anisotropy tensor 1073fc405b4SJames Wright KMUnpack(km_A_ij, A_ij); 1083fc405b4SJames Wright 1093fc405b4SJames Wright // -- Transform physical, anisotropic velocity gradient to isotropic 1103fc405b4SJames Wright MatMat3(grad_velo_aniso, A_ij, CEED_NOTRANSPOSE, CEED_NOTRANSPOSE, grad_velo_iso); 1113fc405b4SJames Wright 1123fc405b4SJames Wright { // -- Get Eigenframe 1133fc405b4SJames Wright CeedScalar kmstrain_iso[6], strain_iso[3][3]; 1143fc405b4SJames Wright CeedInt work_vector[3] = {0}; 1153fc405b4SJames Wright KMStrainRate(grad_velo_iso, kmstrain_iso); 1163fc405b4SJames Wright KMUnpack(kmstrain_iso, strain_iso); 1173fc405b4SJames Wright Diagonalize3(strain_iso, strain_sframe, eigenvectors, work_vector, SORT_DECREASING_EVALS, true, 5); 1183fc405b4SJames Wright } 1193fc405b4SJames Wright 1203fc405b4SJames Wright { // -- Get vorticity in S-frame 1213fc405b4SJames Wright CeedScalar rotation_iso[3][3]; 1223fc405b4SJames Wright RotationRate(grad_velo_iso, rotation_iso); 1233fc405b4SJames Wright CeedScalar vorticity_iso[3] = {-2 * rotation_iso[1][2], 2 * rotation_iso[0][2], -2 * rotation_iso[0][1]}; 1243fc405b4SJames Wright OrientBasisWithVector(eigenvectors, vorticity_iso); 1253fc405b4SJames Wright MatVec3(eigenvectors, vorticity_iso, CEED_NOTRANSPOSE, vorticity_sframe); 1263fc405b4SJames Wright } 1273fc405b4SJames Wright 1283fc405b4SJames Wright // -- Setup DD model inputs 1293fc405b4SJames Wright const CeedScalar grad_velo_magnitude = VelocityGradientMagnitude(strain_sframe, vorticity_sframe); 1303fc405b4SJames Wright CeedScalar inputs[6] = {strain_sframe[0], strain_sframe[1], strain_sframe[2], vorticity_sframe[0], vorticity_sframe[1], viscosity / Square(delta)}; 1313fc405b4SJames Wright ScaleN(inputs, 1 / (grad_velo_magnitude + CEED_EPSILON), 6); 1323fc405b4SJames Wright 1333fc405b4SJames Wright CeedScalar sgs_sframe_sym[6] = {0.}; 1343fc405b4SJames Wright DataDrivenInference(inputs, sgs_sframe_sym, sgsdd_ctx); 1353fc405b4SJames Wright 1363fc405b4SJames Wright CeedScalar old_bounds[6][2] = {{0}}; 1373fc405b4SJames Wright for (int j = 0; j < 6; j++) old_bounds[j][1] = 1; 1383fc405b4SJames Wright const CeedScalar(*new_bounds)[2] = (const CeedScalar(*)[2]) & sgsdd_ctx->data[sgsdd_ctx->offsets.out_scaling]; 1393fc405b4SJames Wright DenormalizeDDOutputs(sgs_sframe_sym, new_bounds, old_bounds); 1403fc405b4SJames Wright 1413fc405b4SJames Wright // Re-dimensionalize sgs_stress 1423fc405b4SJames Wright ScaleN(sgs_sframe_sym, Square(delta) * Square(grad_velo_magnitude), 6); 1433fc405b4SJames Wright 1443fc405b4SJames Wright CeedScalar sgs_stress[3][3] = {{0.}}; 1453fc405b4SJames Wright { // Rotate SGS Stress back to physical frame, SGS_physical = E^T SGS_sframe E 1463fc405b4SJames Wright CeedScalar Evec_sgs[3][3] = {{0.}}; 1473fc405b4SJames Wright const CeedScalar sgs_sframe[3][3] = { 1483fc405b4SJames Wright {sgs_sframe_sym[0], sgs_sframe_sym[3], sgs_sframe_sym[4]}, 1493fc405b4SJames Wright {sgs_sframe_sym[3], sgs_sframe_sym[1], sgs_sframe_sym[5]}, 1503fc405b4SJames Wright {sgs_sframe_sym[4], sgs_sframe_sym[5], sgs_sframe_sym[2]}, 1513fc405b4SJames Wright }; 1523fc405b4SJames Wright MatMat3(eigenvectors, sgs_sframe, CEED_TRANSPOSE, CEED_NOTRANSPOSE, Evec_sgs); 1533fc405b4SJames Wright MatMat3(Evec_sgs, eigenvectors, CEED_NOTRANSPOSE, CEED_NOTRANSPOSE, sgs_stress); 1543fc405b4SJames Wright } 1553fc405b4SJames Wright 1563fc405b4SJames Wright KMPack(sgs_stress, kmsgs_stress); 1573fc405b4SJames Wright } 1583fc405b4SJames Wright 159*ee1455b7SJames Wright // @brief Calculate subgrid stress at nodes using anisotropic data-driven model 160*ee1455b7SJames Wright CEED_QFUNCTION_HELPER int ComputeSGS_DDAnisotropicNodal(void *ctx, CeedInt Q, const CeedScalar *const *in, CeedScalar *const *out, 161*ee1455b7SJames Wright StateFromQi_t StateFromQi) { 162*ee1455b7SJames Wright const CeedScalar(*q)[CEED_Q_VLA] = (const CeedScalar(*)[CEED_Q_VLA])in[0]; 163*ee1455b7SJames Wright const CeedScalar(*x)[CEED_Q_VLA] = (const CeedScalar(*)[CEED_Q_VLA])in[1]; 164*ee1455b7SJames Wright const CeedScalar(*grad_velo)[3][CEED_Q_VLA] = (const CeedScalar(*)[3][CEED_Q_VLA])in[2]; 165*ee1455b7SJames Wright const CeedScalar(*A_ij_delta)[CEED_Q_VLA] = (const CeedScalar(*)[CEED_Q_VLA])in[3]; 166*ee1455b7SJames Wright const CeedScalar(*inv_multiplicity) = (const CeedScalar(*))in[4]; 167*ee1455b7SJames Wright CeedScalar(*v)[CEED_Q_VLA] = (CeedScalar(*)[CEED_Q_VLA])out[0]; 168*ee1455b7SJames Wright 169*ee1455b7SJames Wright const SGS_DDModelContext sgsdd_ctx = (SGS_DDModelContext)ctx; 170*ee1455b7SJames Wright const NewtonianIdealGasContext gas = &sgsdd_ctx->gas; 171*ee1455b7SJames Wright 172*ee1455b7SJames Wright CeedPragmaSIMD for (CeedInt i = 0; i < Q; i++) { 173*ee1455b7SJames Wright const CeedScalar qi[5] = {q[0][i], q[1][i], q[2][i], q[3][i], q[4][i]}; 174*ee1455b7SJames Wright const CeedScalar x_i[3] = {x[0][i], x[1][i], x[2][i]}; 175*ee1455b7SJames Wright const CeedScalar grad_velo_aniso[3][3] = { 176*ee1455b7SJames Wright {grad_velo[0][0][i], grad_velo[0][1][i], grad_velo[0][2][i]}, 177*ee1455b7SJames Wright {grad_velo[1][0][i], grad_velo[1][1][i], grad_velo[1][2][i]}, 178*ee1455b7SJames Wright {grad_velo[2][0][i], grad_velo[2][1][i], grad_velo[2][2][i]} 179*ee1455b7SJames Wright }; 180*ee1455b7SJames Wright const CeedScalar km_A_ij[6] = {A_ij_delta[0][i], A_ij_delta[1][i], A_ij_delta[2][i], A_ij_delta[3][i], A_ij_delta[4][i], A_ij_delta[5][i]}; 181*ee1455b7SJames Wright const CeedScalar delta = A_ij_delta[6][i]; 182*ee1455b7SJames Wright const State s = StateFromQi(gas, qi, x_i); 183*ee1455b7SJames Wright CeedScalar km_sgs[6]; 184*ee1455b7SJames Wright 185*ee1455b7SJames Wright ComputeSGS_DDAnisotropic(grad_velo_aniso, km_A_ij, delta, gas->mu / s.U.density, km_sgs, sgsdd_ctx); 186*ee1455b7SJames Wright 187*ee1455b7SJames Wright for (int j = 0; j < 6; j++) v[j][i] = inv_multiplicity[i] * km_sgs[j]; 188*ee1455b7SJames Wright } 189*ee1455b7SJames Wright return 0; 190*ee1455b7SJames Wright } 191*ee1455b7SJames Wright 192*ee1455b7SJames Wright CEED_QFUNCTION(ComputeSGS_DDAnisotropicNodal_Prim)(void *ctx, CeedInt Q, const CeedScalar *const *in, CeedScalar *const *out) { 193*ee1455b7SJames Wright return ComputeSGS_DDAnisotropicNodal(ctx, Q, in, out, StateFromY); 194*ee1455b7SJames Wright } 195*ee1455b7SJames Wright 196*ee1455b7SJames Wright CEED_QFUNCTION(ComputeSGS_DDAnisotropicNodal_Conserv)(void *ctx, CeedInt Q, const CeedScalar *const *in, CeedScalar *const *out) { 197*ee1455b7SJames Wright return ComputeSGS_DDAnisotropicNodal(ctx, Q, in, out, StateFromU); 198*ee1455b7SJames Wright } 199*ee1455b7SJames Wright 20062b7942eSJames Wright #endif // sgs_dd_model_h 201