1149fb536SJames Wright // Copyright (c) 2017-2024, Lawrence Livermore National Security, LLC and other CEED contributors. 2149fb536SJames Wright // All Rights Reserved. See the top-level LICENSE and NOTICE files for details. 3149fb536SJames Wright // 4149fb536SJames Wright // SPDX-License-Identifier: BSD-2-Clause 5149fb536SJames Wright // 6149fb536SJames Wright // This file is part of CEED: http://github.com/ceed 7149fb536SJames Wright 8149fb536SJames Wright // libCEED + PETSc Example: Navier-Stokes 9149fb536SJames Wright // 10149fb536SJames Wright // This example demonstrates a simple usage of libCEED with PETSc to solve a Navier-Stokes problem. 11149fb536SJames Wright // 12149fb536SJames Wright // Build with: 13149fb536SJames Wright // 14149fb536SJames Wright // make [PETSC_DIR=</path/to/petsc>] [CEED_DIR=</path/to/libceed>] navierstokes 15149fb536SJames Wright // 16149fb536SJames Wright // Sample runs: 17149fb536SJames Wright // 18149fb536SJames Wright // ./navierstokes -ceed /cpu/self -options_file gaussianwave.yml 19149fb536SJames Wright // ./navierstokes -ceed /gpu/cuda -problem advection -degree 1 20149fb536SJames Wright // 21149fb536SJames Wright //TESTARGS(name="Newtonian and Riemann Solver Unit Tests",only="cpu") -ceed {ceed_resource} -test_type solver -options_file examples/gaussianwave.yaml -compare_final_state_atol 1e100 -compare_final_state_filename tests/output/fluids-navierstokes-gaussianwave-IDL-entropy.bin -dm_plex_box_faces 5,5,1 -ts_max_steps 0 -newtonian_unit_tests -riemann_solver_unit_tests 22149fb536SJames Wright //TESTARGS(name="Gaussian Wave, IDL and Entropy variables") -ceed {ceed_resource} -test_type solver -options_file examples/gaussianwave.yaml -compare_final_state_atol 2e-11 -compare_final_state_filename tests/output/fluids-navierstokes-gaussianwave-IDL-entropy.bin -state_var entropy -dm_plex_box_faces 5,5,1 -ts_max_steps 5 -idl_decay_time 2e-3 -idl_length 0.25 -idl_start 0 -idl_pressure 70 23*5ba826a2SJames Wright //TESTARGS(name="Blasius, SGS DataDriven Sequential Torch",only="torch") -ceed {ceed_resource} -options_file tests/blasius_stgtest.yaml -sgs_model_type data_driven -sgs_model_dd_leakyrelu_alpha 0.3 -sgs_model_dd_parameter_dir examples/dd_sgs_data -ts_dt 2e-9 -state_var primitive -ksp_rtol 1e-12 -snes_rtol 1e-12 -stg_mean_only -stg_fluctuating_IC -test_type solver -compare_final_state_atol 1e-10 -compare_final_state_filename tests/output/fluids-navierstokes-blasius-sgs-data-driven.bin -sgs_model_dd_implementation sequential_torch -sgs_model_dd_torch_model_path ./tests/createPyTorchModel/NNModel_HIT_fp64_jit.pt 24*5ba826a2SJames Wright //TESTARGS(name="Blasius, SGS DataDriven Sequential Ceed") -ceed {ceed_resource} -options_file tests/blasius_stgtest.yaml -sgs_model_type data_driven -sgs_model_dd_leakyrelu_alpha 0.3 -sgs_model_dd_parameter_dir examples/dd_sgs_data -ts_dt 2e-9 -state_var primitive -ksp_rtol 1e-12 -snes_rtol 1e-12 -stg_mean_only -stg_fluctuating_IC -test_type solver -compare_final_state_atol 1e-10 -compare_final_state_filename tests/output/fluids-navierstokes-blasius-sgs-data-driven.bin -sgs_model_dd_implementation sequential_ceed 25149fb536SJames Wright //TESTARGS(name="Gaussian Wave, explicit, supg, IDL") -ceed {ceed_resource} -test_type solver -options_file examples/gaussianwave.yaml -compare_final_state_atol 1e-8 -compare_final_state_filename tests/output/fluids-navierstokes-gaussianwave-explicit.bin -dm_plex_box_faces 2,2,1 -ts_max_steps 5 -degree 3 -implicit false -ts_type rk -stab supg -state_var conservative -mass_ksp_type gmres -mass_pc_jacobi_type diagonal -idl_decay_time 2e-3 -idl_length 0.25 -idl_start 0 -idl_pressure 70 26149fb536SJames Wright //TESTARGS(name="Advection 2D, rotation, explicit, supg, consistent mass") -ceed {ceed_resource} -test_type solver -problem advection -degree 3 -dm_plex_box_faces 2,2 -dm_plex_box_lower 0,0 -dm_plex_box_upper 125,125 -bc_wall 1,2,3,4 -wall_comps 4 -units_kilogram 1e-9 -rc 100. -ts_dt 1e-3 -ts_max_steps 10 -stab supg -Ctaus 0.5 -mass_ksp_type gmres -mass_pc_type vpbjacobi -compare_final_state_atol 1e-10 -compare_final_state_filename tests/output/fluids-navierstokes-adv2d-rotation-explicit-stab-supg-consistent-mass.bin 27149fb536SJames Wright //TESTARGS(name="Advection, skew") -ceed {ceed_resource} -test_type solver -options_file examples/advection.yaml -ts_max_steps 5 -wind_type translation -wind_translation -0.5547002,0.83205029,0 -advection_ic_type skew -dm_plex_box_faces 2,1,1 -degree 2 -stab supg -stab_tau advdiff_shakib -Ctau_a 4 -ksp_type gmres -diffusion_coeff 5e-4 -compare_final_state_atol 7e-10 -compare_final_state_filename tests/output/fluids-navierstokes-adv-skew.bin 28149fb536SJames Wright //TESTARGS(name="Blasius, bc_slip") -ceed {ceed_resource} -test_type solver -options_file examples/blasius.yaml -ts_max_steps 5 -dm_plex_box_faces 3,20,1 -platemesh_nDelta 10 -platemesh_growth 1.2 -bc_outflow 5 -bc_slip 4 -compare_final_state_atol 2E-11 -compare_final_state_filename tests/output/fluids-navierstokes-blasius-bc_slip.bin 29149fb536SJames Wright //TESTARGS(name="Advection, rotation, cosine") -ceed {ceed_resource} -test_type solver -options_file examples/advection.yaml -ts_max_steps 0 -advection_ic_type cosine_hill -dm_plex_box_faces 2,1,1 -compare_final_state_atol 1e-10 -compare_final_state_filename tests/output/fluids-navierstokes-adv-rotation-cosine.bin 30149fb536SJames Wright //TESTARGS(name="Gaussian Wave, using MatShell") -ceed {ceed_resource} -test_type solver -options_file examples/gaussianwave.yaml -compare_final_state_atol 1e-8 -compare_final_state_filename tests/output/fluids-navierstokes-gaussianwave-shell.bin -dm_plex_box_faces 2,2,1 -ts_max_steps 5 -degree 3 -amat_type shell -pc_type vpbjacobi -ts_alpha_radius 0.5 31149fb536SJames Wright //TESTARGS(name="Taylor-Green Vortex IC") -ceed {ceed_resource} -problem taylor_green -test_type solver -dm_plex_dim 3 -dm_plex_box_faces 6,6,6 -ts_max_steps 0 -compare_final_state_atol 1e-12 -compare_final_state_filename tests/output/fluids-navierstokes-taylor-green-IC.bin 32*5ba826a2SJames Wright //TESTARGS(name="Blasius, SGS DataDriven Fused") -ceed {ceed_resource} -options_file tests/blasius_stgtest.yaml -sgs_model_type data_driven -sgs_model_dd_leakyrelu_alpha 0.3 -sgs_model_dd_parameter_dir examples/dd_sgs_data -ts_dt 2e-9 -state_var primitive -ksp_rtol 1e-12 -snes_rtol 1e-12 -stg_mean_only -stg_fluctuating_IC -test_type solver -compare_final_state_atol 1e-10 -compare_final_state_filename tests/output/fluids-navierstokes-blasius-sgs-data-driven.bin 33149fb536SJames Wright //TESTARGS(name="Blasius, Anisotropic Differential Filter") -ceed {ceed_resource} -test_type diff_filter -options_file tests/blasius_test.yaml -compare_final_state_atol 5e-10 -compare_final_state_filename tests/output/fluids-navierstokes-blasius_diff_filter_aniso_vandriest.bin -diff_filter_monitor -ts_max_steps 0 -state_var primitive -diff_filter_friction_length 1e-5 -diff_filter_wall_damping_function van_driest -diff_filter_ksp_rtol 1e-8 -diff_filter_grid_based_width -diff_filter_width_scaling 1,0.7,1 34149fb536SJames Wright //TESTARGS(name="Blasius, Isotropic Differential Filter") -ceed {ceed_resource} -test_type diff_filter -options_file tests/blasius_test.yaml -compare_final_state_atol 2e-12 -compare_final_state_filename tests/output/fluids-navierstokes-blasius_diff_filter_iso.bin -diff_filter_monitor -ts_max_steps 0 -diff_filter_width_scaling 4.2e-5,4.2e-5,4.2e-5 -diff_filter_ksp_atol 1e-14 -diff_filter_ksp_rtol 1e-16 35149fb536SJames Wright //TESTARGS(name="Gaussian Wave, with IDL") -ceed {ceed_resource} -test_type solver -options_file examples/gaussianwave.yaml -compare_final_state_atol 2e-11 -compare_final_state_filename tests/output/fluids-navierstokes-gaussianwave-IDL.bin -dm_plex_box_faces 5,5,1 -ts_max_steps 5 -idl_decay_time 2e-3 -idl_length 0.25 -idl_start 0 -ts_alpha_radius 0.5 -idl_pressure 70 36149fb536SJames Wright //TESTARGS(name="Spanwise Turbulence Statistics") -ceed {ceed_resource} -test_type turb_spanstats -options_file tests/stats_test.yaml -compare_final_state_atol 1E-11 -compare_final_state_filename tests/output/fluids-navierstokes-turb-spanstats-stats.bin 37149fb536SJames Wright //TESTARGS(name="Blasius") -ceed {ceed_resource} -test_type solver -options_file tests/blasius_test.yaml -compare_final_state_atol 2E-11 -compare_final_state_filename tests/output/fluids-navierstokes-blasius.bin 38149fb536SJames Wright //TESTARGS(name="Blasius, STG Inflow") -ceed {ceed_resource} -test_type solver -options_file tests/blasius_stgtest.yaml -compare_final_state_atol 2E-11 -compare_final_state_filename tests/output/fluids-navierstokes-blasius_STG.bin 39149fb536SJames Wright //TESTARGS(name="Blasius, STG Inflow, Weak Temperature") -ceed {ceed_resource} -test_type solver -options_file tests/blasius_stgtest.yaml -compare_final_state_atol 1E-11 -compare_final_state_filename tests/output/fluids-navierstokes-blasius_STG_weakT.bin -weakT 40149fb536SJames Wright //TESTARGS(name="Blasius, Strong STG Inflow") -ceed {ceed_resource} -test_type solver -options_file tests/blasius_stgtest.yaml -compare_final_state_atol 1E-10 -compare_final_state_filename tests/output/fluids-navierstokes-blasius_STG_strongBC.bin -stg_strong true 41149fb536SJames Wright //TESTARGS(name="Channel") -ceed {ceed_resource} -test_type solver -options_file examples/channel.yaml -compare_final_state_atol 2e-11 -compare_final_state_filename tests/output/fluids-navierstokes-channel.bin -dm_plex_box_faces 5,5,1 -ts_max_steps 5 42149fb536SJames Wright //TESTARGS(name="Channel, Primitive") -ceed {ceed_resource} -test_type solver -options_file examples/channel.yaml -compare_final_state_atol 2e-11 -compare_final_state_filename tests/output/fluids-navierstokes-channel-prim.bin -dm_plex_box_faces 5,5,1 -ts_max_steps 5 -state_var primitive 43149fb536SJames Wright //TESTARGS(name="Density Current, explicit") -ceed {ceed_resource} -test_type solver -degree 3 -q_extra 2 -dm_plex_box_faces 1,1,2 -dm_plex_box_lower 0,0,0 -dm_plex_box_upper 125,125,250 -dm_plex_dim 3 -bc_symmetry_x 5,6 -bc_symmetry_y 3,4 -bc_symmetry_z 1,2 -units_kilogram 1e-9 -center 62.5,62.5,187.5 -rc 100. -thetaC -35. -mu 75 -gravity 0,0,-9.81 -ts_dt 1e-3 -units_meter 1e-2 -units_second 1e-2 -ts_max_steps 10 -compare_final_state_atol 1E-11 -compare_final_state_filename tests/output/fluids-navierstokes-dc-explicit.bin 44149fb536SJames Wright //TESTARGS(name="Density Current, implicit, no stabilization") -ceed {ceed_resource} -test_type solver -degree 3 -dm_plex_box_faces 1,1,2 -dm_plex_box_lower 0,0,0 -dm_plex_box_upper 125,125,250 -dm_plex_dim 3 -bc_symmetry_x 5,6 -bc_symmetry_y 3,4 -bc_symmetry_z 1,2 -units_kilogram 1e-9 -center 62.5,62.5,187.5 -rc 100. -thetaC -35. -mu 75 -gravity 0,0,-9.81 -units_meter 1e-2 -units_second 1e-2 -ksp_atol 1e-4 -ksp_rtol 1e-3 -ksp_type bcgs -snes_atol 1e-3 -snes_lag_jacobian 100 -snes_lag_jacobian_persists -snes_mf_operator -ts_dt 1e-3 -implicit -ts_type alpha -ts_max_steps 10 -compare_final_state_atol 5E-4 -compare_final_state_filename tests/output/fluids-navierstokes-dc-implicit-stab-none.bin 45149fb536SJames Wright //TESTARGS(name="Advection, rotation, implicit, SUPG stabilization") -ceed {ceed_resource} -test_type solver -problem advection -CtauS .3 -stab supg -degree 3 -dm_plex_box_faces 1,1,2 -dm_plex_box_lower 0,0,0 -dm_plex_box_upper 125,125,250 -dm_plex_dim 3 -bc_wall 1,2,3,4,5,6 -wall_comps 4 -units_kilogram 1e-9 -rc 100. -ksp_atol 1e-4 -ksp_rtol 1e-3 -ksp_type bcgs -snes_atol 1e-3 -snes_lag_jacobian 100 -snes_lag_jacobian_persists -snes_mf_operator -ts_dt 1e-3 -implicit -dm_mat_preallocate_skip 0 -ts_type alpha -compare_final_state_atol 5E-4 -ts_max_steps 10 -compare_final_state_filename tests/output/fluids-navierstokes-adv-rotation-implicit-stab-supg.bin 46149fb536SJames Wright //TESTARGS(name="Advection, translation, implicit, SU stabilization") -ceed {ceed_resource} -test_type solver -problem advection -CtauS .3 -stab su -degree 3 -dm_plex_box_faces 1,1,2 -dm_plex_box_lower 0,0,0 -dm_plex_box_upper 125,125,250 -dm_plex_dim 3 -units_kilogram 1e-9 -rc 100. -ksp_atol 1e-4 -ksp_rtol 1e-3 -ksp_type bcgs -snes_atol 1e-3 -snes_lag_jacobian 100 -snes_lag_jacobian_persists -snes_mf_operator -ts_dt 1e-3 -implicit -dm_mat_preallocate_skip 0 -ts_type alpha -wind_type translation -wind_translation .53,-1.33,-2.65 -bc_inflow 1,2,3,4,5,6 -ts_max_steps 10 -compare_final_state_atol 5E-4 -compare_final_state_filename tests/output/fluids-navierstokes-adv-translation-implicit-stab-su.bin 47149fb536SJames Wright //TESTARGS(name="Advection 2D, rotation, explicit, strong form") -ceed {ceed_resource} -test_type solver -problem advection -strong_form 1 -degree 3 -dm_plex_box_faces 2,2 -dm_plex_box_lower 0,0 -dm_plex_box_upper 125,125 -bc_wall 1,2,3,4 -wall_comps 4 -units_kilogram 1e-9 -rc 100. -ts_dt 1e-3 -compare_final_state_atol 5E-11 -ts_max_steps 10 -compare_final_state_filename tests/output/fluids-navierstokes-adv2d-rotation-explicit-strong.bin 48149fb536SJames Wright //TESTARGS(name="Advection 2D, rotation, implicit, SUPG stabilization") -ceed {ceed_resource} -test_type solver -problem advection -CtauS .3 -stab supg -degree 3 -dm_plex_box_faces 1,1,2 -dm_plex_box_lower 0,0 -dm_plex_box_upper 125,125 -bc_wall 1,2,3,4 -wall_comps 4 -units_kilogram 1e-9 -rc 100. -ksp_atol 1e-4 -ksp_rtol 1e-3 -ksp_type bcgs -snes_atol 1e-3 -snes_lag_jacobian 100 -snes_lag_jacobian_persists -snes_mf_operator -ts_dt 1e-3 -implicit -dm_mat_preallocate_skip 0 -ts_type alpha -ts_max_steps 10 -compare_final_state_atol 5E-4 -compare_final_state_filename tests/output/fluids-navierstokes-adv2d-rotation-implicit-stab-supg.bin 49149fb536SJames Wright //TESTARGS(name="Euler, implicit") -ceed {ceed_resource} -test_type solver -problem euler_vortex -degree 3 -dm_plex_box_faces 1,1,2 -dm_plex_box_lower 0,0,0 -dm_plex_box_upper 125,125,250 -dm_plex_dim 3 -units_meter 1e-4 -units_second 1e-4 -mean_velocity 1.4,-2.,0 -bc_inflow 4,6 -bc_outflow 3,5 -bc_symmetry_z 1,2 -vortex_strength 2 -ksp_atol 1e-4 -ksp_rtol 1e-3 -ksp_type bcgs -snes_atol 1e-3 -snes_lag_jacobian 100 -snes_lag_jacobian_persists -snes_mf_operator -ts_dt 1e-3 -implicit -dm_mat_preallocate_skip 0 -ts_type alpha -ts_max_steps 10 -compare_final_state_atol 5E-4 -compare_final_state_filename tests/output/fluids-navierstokes-euler-implicit.bin 50149fb536SJames Wright //TESTARGS(name="Euler, explicit") -ceed {ceed_resource} -test_type solver -problem euler_vortex -degree 3 -q_extra 2 -dm_plex_box_faces 2,2,1 -dm_plex_box_lower 0,0,0 -dm_plex_box_upper 125,125,250 -dm_plex_dim 3 -units_meter 1e-4 -units_second 1e-4 -mean_velocity 1.4,-2.,0 -bc_inflow 4,6 -bc_outflow 3,5 -bc_symmetry_z 1,2 -vortex_strength 2 -ts_dt 1e-7 -ts_rk_type 5bs -ts_rtol 1e-10 -ts_atol 1e-10 -ts_max_steps 10 -compare_final_state_atol 1E-7 -compare_final_state_filename tests/output/fluids-navierstokes-euler-explicit.bin 51149fb536SJames Wright //TESTARGS(name="Sod Shocktube, explicit, SU stabilization, y-z-beta shock capturing") -ceed {ceed_resource} -test_type solver -problem shocktube -degree 1 -q_extra 2 -dm_plex_box_faces 50,1,1 -units_meter 1e-2 units_second 1e-2 -dm_plex_box_lower 0,0,0 -dm_plex_box_upper 1000,20,20 -dm_plex_dim 3 -bc_symmetry_x 5,6 -bc_symmetry_y 3,4 -bc_symmetry_z 1,2 -yzb -stab su -ts_max_steps 10 -compare_final_state_atol 1E-11 -compare_final_state_filename tests/output/fluids-navierstokes-shocktube-explicit-su-yzb.bin 52149fb536SJames Wright 53149fb536SJames Wright /// @file 54149fb536SJames Wright /// Navier-Stokes example using PETSc 55149fb536SJames Wright 56149fb536SJames Wright const char help[] = "Solve Navier-Stokes using PETSc and libCEED\n"; 57149fb536SJames Wright 58149fb536SJames Wright #include <navierstokes.h> 59149fb536SJames Wright #include <petscdevice.h> 60149fb536SJames Wright 61149fb536SJames Wright #include <ceed.h> 62149fb536SJames Wright #include <petscdmplex.h> 63149fb536SJames Wright #include <petscts.h> 64149fb536SJames Wright 65149fb536SJames Wright int main(int argc, char **argv) { 66149fb536SJames Wright // --------------------------------------------------------------------------- 67149fb536SJames Wright // Initialize PETSc 68149fb536SJames Wright // --------------------------------------------------------------------------- 69149fb536SJames Wright PetscCall(PetscInitialize(&argc, &argv, NULL, help)); 70149fb536SJames Wright 71149fb536SJames Wright // --------------------------------------------------------------------------- 72149fb536SJames Wright // Create structs 73149fb536SJames Wright // --------------------------------------------------------------------------- 74149fb536SJames Wright AppCtx app_ctx; 75149fb536SJames Wright PetscCall(PetscCalloc1(1, &app_ctx)); 76149fb536SJames Wright 77149fb536SJames Wright ProblemData problem; 78149fb536SJames Wright PetscCall(PetscCalloc1(1, &problem)); 79149fb536SJames Wright 80149fb536SJames Wright User user; 81149fb536SJames Wright PetscCall(PetscCalloc1(1, &user)); 82149fb536SJames Wright 83149fb536SJames Wright CeedData ceed_data; 84149fb536SJames Wright PetscCall(PetscCalloc1(1, &ceed_data)); 85149fb536SJames Wright 86149fb536SJames Wright SimpleBC bc; 87149fb536SJames Wright PetscCall(PetscCalloc1(1, &bc)); 88149fb536SJames Wright 89149fb536SJames Wright Physics phys_ctx; 90149fb536SJames Wright PetscCall(PetscCalloc1(1, &phys_ctx)); 91149fb536SJames Wright 92149fb536SJames Wright Units units; 93149fb536SJames Wright PetscCall(PetscCalloc1(1, &units)); 94149fb536SJames Wright 95149fb536SJames Wright user->app_ctx = app_ctx; 96149fb536SJames Wright user->units = units; 97149fb536SJames Wright user->phys = phys_ctx; 98149fb536SJames Wright problem->set_bc_from_ics = PETSC_TRUE; 99149fb536SJames Wright 100149fb536SJames Wright PetscCall(RegisterLogEvents()); 101149fb536SJames Wright 102149fb536SJames Wright // --------------------------------------------------------------------------- 103149fb536SJames Wright // Process command line options 104149fb536SJames Wright // --------------------------------------------------------------------------- 105149fb536SJames Wright // -- Register problems to be available on the command line 106149fb536SJames Wright PetscCall(RegisterProblems_NS(app_ctx)); 107149fb536SJames Wright 108149fb536SJames Wright // -- Process general command line options 109149fb536SJames Wright MPI_Comm comm = PETSC_COMM_WORLD; 110149fb536SJames Wright user->comm = comm; 111149fb536SJames Wright PetscCall(ProcessCommandLineOptions(comm, app_ctx, bc)); 112149fb536SJames Wright PetscCall(BoundaryConditionSetUp(user, problem, app_ctx, bc)); 113149fb536SJames Wright 114149fb536SJames Wright // --------------------------------------------------------------------------- 115149fb536SJames Wright // Initialize libCEED 116149fb536SJames Wright // --------------------------------------------------------------------------- 117149fb536SJames Wright // -- Initialize backend 118149fb536SJames Wright Ceed ceed; 119149fb536SJames Wright PetscCheck(CeedInit(app_ctx->ceed_resource, &ceed) == CEED_ERROR_SUCCESS, comm, PETSC_ERR_LIB, "Ceed initialization failed"); 120149fb536SJames Wright user->ceed = ceed; 121149fb536SJames Wright 122149fb536SJames Wright PetscCheck(CeedSetErrorHandler(ceed, CeedErrorStore) == CEED_ERROR_SUCCESS, comm, PETSC_ERR_LIB, "Setting libCEED error handler failed"); 123149fb536SJames Wright 124149fb536SJames Wright // -- Check preferred MemType 125149fb536SJames Wright CeedMemType mem_type_backend; 126149fb536SJames Wright PetscCallCeed(ceed, CeedGetPreferredMemType(ceed, &mem_type_backend)); 127149fb536SJames Wright 128149fb536SJames Wright { 129149fb536SJames Wright const char *resource; 130149fb536SJames Wright PetscCallCeed(ceed, CeedGetResource(ceed, &resource)); 131149fb536SJames Wright if (strstr(resource, "/gpu/sycl")) { 132149fb536SJames Wright PetscDeviceContext dctx; 133149fb536SJames Wright PetscCall(PetscDeviceContextGetCurrentContext(&dctx)); 134149fb536SJames Wright void *stream_handle; 135149fb536SJames Wright PetscCall(PetscDeviceContextGetStreamHandle(dctx, &stream_handle)); 136149fb536SJames Wright PetscCallCeed(ceed, CeedSetStream(ceed, stream_handle)); 137149fb536SJames Wright } 138149fb536SJames Wright } 139149fb536SJames Wright 140149fb536SJames Wright // --------------------------------------------------------------------------- 141149fb536SJames Wright // Set up global mesh 142149fb536SJames Wright // --------------------------------------------------------------------------- 143149fb536SJames Wright // -- Create DM 144149fb536SJames Wright DM dm; 145149fb536SJames Wright VecType vec_type = NULL; 146149fb536SJames Wright MatType mat_type = NULL; 147149fb536SJames Wright switch (mem_type_backend) { 148149fb536SJames Wright case CEED_MEM_HOST: 149149fb536SJames Wright vec_type = VECSTANDARD; 150149fb536SJames Wright break; 151149fb536SJames Wright case CEED_MEM_DEVICE: { 152149fb536SJames Wright const char *resolved; 153149fb536SJames Wright PetscCallCeed(ceed, CeedGetResource(ceed, &resolved)); 154149fb536SJames Wright if (strstr(resolved, "/gpu/cuda")) vec_type = VECCUDA; 155149fb536SJames Wright else if (strstr(resolved, "/gpu/hip")) vec_type = VECKOKKOS; 156149fb536SJames Wright else if (strstr(resolved, "/gpu/sycl")) vec_type = VECKOKKOS; 157149fb536SJames Wright else vec_type = VECSTANDARD; 158149fb536SJames Wright } 159149fb536SJames Wright } 160149fb536SJames Wright if (strstr(vec_type, VECCUDA)) mat_type = MATAIJCUSPARSE; 161149fb536SJames Wright else if (strstr(vec_type, VECKOKKOS)) mat_type = MATAIJKOKKOS; 162149fb536SJames Wright else mat_type = MATAIJ; 163149fb536SJames Wright PetscCall(CreateDM(comm, problem, mat_type, vec_type, &dm)); 164149fb536SJames Wright user->dm = dm; 165149fb536SJames Wright PetscCall(DMSetApplicationContext(dm, user)); 166149fb536SJames Wright 167149fb536SJames Wright // --------------------------------------------------------------------------- 168149fb536SJames Wright // Choose the problem from the list of registered problems 169149fb536SJames Wright // --------------------------------------------------------------------------- 170149fb536SJames Wright { 171149fb536SJames Wright PetscErrorCode (*p)(ProblemData, DM, void *, SimpleBC); 172149fb536SJames Wright PetscCall(PetscFunctionListFind(app_ctx->problems, app_ctx->problem_name, &p)); 173149fb536SJames Wright PetscCheck(p, PETSC_COMM_SELF, 1, "Problem '%s' not found", app_ctx->problem_name); 174149fb536SJames Wright PetscCall((*p)(problem, dm, &user, bc)); 175149fb536SJames Wright } 176149fb536SJames Wright 177149fb536SJames Wright // -- Set up DM 178149fb536SJames Wright PetscCall(SetUpDM(dm, problem, app_ctx->degree, app_ctx->q_extra, bc, phys_ctx)); 179149fb536SJames Wright 180149fb536SJames Wright // -- Refine DM for high-order viz 181149fb536SJames Wright if (app_ctx->viz_refine) PetscCall(VizRefineDM(dm, user, problem, bc, phys_ctx)); 182149fb536SJames Wright 183149fb536SJames Wright // --------------------------------------------------------------------------- 184149fb536SJames Wright // Create solution vectors 185149fb536SJames Wright // --------------------------------------------------------------------------- 186149fb536SJames Wright // -- Set up global state vector Q 187149fb536SJames Wright Vec Q; 188149fb536SJames Wright PetscCall(DMCreateGlobalVector(dm, &Q)); 189149fb536SJames Wright PetscCall(VecZeroEntries(Q)); 190149fb536SJames Wright 191149fb536SJames Wright // -- Set up local state vectors Q_loc, Q_dot_loc 192149fb536SJames Wright PetscCall(DMCreateLocalVector(dm, &user->Q_loc)); 193149fb536SJames Wright PetscCall(DMCreateLocalVector(dm, &user->Q_dot_loc)); 194149fb536SJames Wright PetscCall(VecZeroEntries(user->Q_dot_loc)); 195149fb536SJames Wright 196149fb536SJames Wright // --------------------------------------------------------------------------- 197149fb536SJames Wright // Set up libCEED 198149fb536SJames Wright // --------------------------------------------------------------------------- 199149fb536SJames Wright // -- Set up libCEED objects 200149fb536SJames Wright PetscCall(SetupLibceed(ceed, ceed_data, dm, user, app_ctx, problem, bc)); 201149fb536SJames Wright 202149fb536SJames Wright // --------------------------------------------------------------------------- 203149fb536SJames Wright // Set up ICs 204149fb536SJames Wright // --------------------------------------------------------------------------- 205149fb536SJames Wright // -- Fix multiplicity for ICs 206149fb536SJames Wright PetscCall(ICs_FixMultiplicity(dm, ceed_data, user, user->Q_loc, Q, 0.0)); 207149fb536SJames Wright 208149fb536SJames Wright // --------------------------------------------------------------------------- 209149fb536SJames Wright // Record boundary values from initial condition 210149fb536SJames Wright // --------------------------------------------------------------------------- 211149fb536SJames Wright // -- This overrides DMPlexInsertBoundaryValues(). 212149fb536SJames Wright // We use this for the main simulation DM because the reference DMPlexInsertBoundaryValues() is very slow on the GPU due to extra device-to-host 213149fb536SJames Wright // communication. If we disable this, we should still get the same results due to the problem->bc function, but with potentially much slower 214149fb536SJames Wright // execution. 215149fb536SJames Wright if (problem->set_bc_from_ics) { 216149fb536SJames Wright PetscCall(SetBCsFromICs(dm, Q, user->Q_loc)); 217149fb536SJames Wright } 218149fb536SJames Wright 219149fb536SJames Wright // --------------------------------------------------------------------------- 220149fb536SJames Wright // Create output directory 221149fb536SJames Wright // --------------------------------------------------------------------------- 222149fb536SJames Wright PetscMPIInt rank; 223149fb536SJames Wright MPI_Comm_rank(comm, &rank); 224149fb536SJames Wright if (!rank) { 225149fb536SJames Wright PetscCall(PetscMkdir(app_ctx->output_dir)); 226149fb536SJames Wright } 227149fb536SJames Wright 228149fb536SJames Wright // --------------------------------------------------------------------------- 229149fb536SJames Wright // Gather initial Q values in case of continuation of simulation 230149fb536SJames Wright // --------------------------------------------------------------------------- 231149fb536SJames Wright // -- Set up initial values from binary file 232149fb536SJames Wright if (app_ctx->cont_steps) { 233149fb536SJames Wright PetscCall(SetupICsFromBinary(comm, app_ctx, Q)); 234149fb536SJames Wright } 235149fb536SJames Wright 236149fb536SJames Wright // -- Zero Q_loc 237149fb536SJames Wright PetscCall(VecZeroEntries(user->Q_loc)); 238149fb536SJames Wright 239149fb536SJames Wright // --------------------------------------------------------------------------- 240149fb536SJames Wright // TS: Create, setup, and solve 241149fb536SJames Wright // --------------------------------------------------------------------------- 242149fb536SJames Wright TS ts; 243149fb536SJames Wright PetscScalar final_time; 244149fb536SJames Wright PetscCall(TSSolve_NS(dm, user, app_ctx, phys_ctx, problem, &Q, &final_time, &ts)); 245149fb536SJames Wright 246149fb536SJames Wright // --------------------------------------------------------------------------- 247149fb536SJames Wright // Post-processing 248149fb536SJames Wright // --------------------------------------------------------------------------- 249149fb536SJames Wright PetscCall(PostProcess(ts, ceed_data, dm, problem, user, Q, final_time)); 250149fb536SJames Wright 251149fb536SJames Wright // --------------------------------------------------------------------------- 252149fb536SJames Wright // Destroy libCEED objects 253149fb536SJames Wright // --------------------------------------------------------------------------- 254149fb536SJames Wright 255149fb536SJames Wright PetscCall(TurbulenceStatisticsDestroy(user, ceed_data)); 256149fb536SJames Wright PetscCall(NodalProjectionDataDestroy(user->grad_velo_proj)); 257149fb536SJames Wright PetscCall(SgsDDDataDestroy(user->sgs_dd_data)); 258149fb536SJames Wright PetscCall(DifferentialFilterDataDestroy(user->diff_filter)); 259149fb536SJames Wright PetscCall(SGS_DD_TrainingDataDestroy(user->sgs_dd_train)); 260149fb536SJames Wright PetscCall(SmartSimDataDestroy(user->smartsim)); 261149fb536SJames Wright 262149fb536SJames Wright // -- Vectors 263149fb536SJames Wright PetscCallCeed(ceed, CeedVectorDestroy(&ceed_data->x_coord)); 264149fb536SJames Wright PetscCallCeed(ceed, CeedVectorDestroy(&ceed_data->q_data)); 265149fb536SJames Wright PetscCallCeed(ceed, CeedVectorDestroy(&user->q_ceed)); 266149fb536SJames Wright PetscCallCeed(ceed, CeedVectorDestroy(&user->q_dot_ceed)); 267149fb536SJames Wright PetscCallCeed(ceed, CeedVectorDestroy(&user->g_ceed)); 268149fb536SJames Wright 269149fb536SJames Wright // -- Bases 270149fb536SJames Wright PetscCallCeed(ceed, CeedBasisDestroy(&ceed_data->basis_q)); 271149fb536SJames Wright PetscCallCeed(ceed, CeedBasisDestroy(&ceed_data->basis_x)); 272149fb536SJames Wright 273149fb536SJames Wright // -- Restrictions 274149fb536SJames Wright PetscCallCeed(ceed, CeedElemRestrictionDestroy(&ceed_data->elem_restr_q)); 275149fb536SJames Wright PetscCallCeed(ceed, CeedElemRestrictionDestroy(&ceed_data->elem_restr_x)); 276149fb536SJames Wright PetscCallCeed(ceed, CeedElemRestrictionDestroy(&ceed_data->elem_restr_qd_i)); 277149fb536SJames Wright 278149fb536SJames Wright // Destroy QFunction contexts after using 279149fb536SJames Wright // ToDo: Simplify tracked libCEED objects, smaller struct 280149fb536SJames Wright { 281149fb536SJames Wright PetscCallCeed(ceed, CeedQFunctionContextDestroy(&problem->apply_inflow.qfunction_context)); 282149fb536SJames Wright PetscCallCeed(ceed, CeedQFunctionContextDestroy(&problem->apply_inflow_jacobian.qfunction_context)); 283149fb536SJames Wright PetscCallCeed(ceed, CeedQFunctionContextDestroy(&problem->apply_outflow.qfunction_context)); 284149fb536SJames Wright PetscCallCeed(ceed, CeedQFunctionContextDestroy(&problem->apply_outflow_jacobian.qfunction_context)); 285149fb536SJames Wright PetscCallCeed(ceed, CeedQFunctionContextDestroy(&problem->apply_freestream.qfunction_context)); 286149fb536SJames Wright PetscCallCeed(ceed, CeedQFunctionContextDestroy(&problem->apply_freestream_jacobian.qfunction_context)); 287149fb536SJames Wright PetscCallCeed(ceed, CeedQFunctionContextDestroy(&problem->apply_slip.qfunction_context)); 288149fb536SJames Wright PetscCallCeed(ceed, CeedQFunctionContextDestroy(&problem->apply_slip_jacobian.qfunction_context)); 289149fb536SJames Wright PetscCallCeed(ceed, CeedQFunctionContextDestroy(&problem->ics.qfunction_context)); 290149fb536SJames Wright PetscCallCeed(ceed, CeedQFunctionContextDestroy(&problem->apply_vol_rhs.qfunction_context)); 291149fb536SJames Wright PetscCallCeed(ceed, CeedQFunctionContextDestroy(&problem->apply_vol_ifunction.qfunction_context)); 292149fb536SJames Wright PetscCallCeed(ceed, CeedQFunctionContextDestroy(&problem->apply_vol_ijacobian.qfunction_context)); 293149fb536SJames Wright } 294149fb536SJames Wright 295149fb536SJames Wright // -- Operators 296149fb536SJames Wright PetscCall(OperatorApplyContextDestroy(ceed_data->op_ics_ctx)); 297149fb536SJames Wright PetscCall(OperatorApplyContextDestroy(user->op_rhs_ctx)); 298149fb536SJames Wright PetscCall(OperatorApplyContextDestroy(user->op_strong_bc_ctx)); 299149fb536SJames Wright PetscCallCeed(ceed, CeedOperatorDestroy(&user->op_ifunction)); 300149fb536SJames Wright 301149fb536SJames Wright // -- Ceed 302149fb536SJames Wright PetscCheck(CeedDestroy(&ceed) == CEED_ERROR_SUCCESS, comm, PETSC_ERR_LIB, "Destroying Ceed object failed"); 303149fb536SJames Wright 304149fb536SJames Wright if (app_ctx->test_type != TESTTYPE_NONE) { 305149fb536SJames Wright PetscInt num_options_left = 0; 306149fb536SJames Wright PetscCall(PetscOptionsLeftGet(NULL, &num_options_left, NULL, NULL)); 307149fb536SJames Wright PetscCheck(num_options_left == 0, PETSC_COMM_WORLD, -1, 308149fb536SJames Wright "There are unused options. This is not allowed. See error message for the unused options (or use -options_left directly)"); 309149fb536SJames Wright } 310149fb536SJames Wright 311149fb536SJames Wright // --------------------------------------------------------------------------- 312149fb536SJames Wright // Clean up PETSc 313149fb536SJames Wright // --------------------------------------------------------------------------- 314149fb536SJames Wright // -- Vectors 315149fb536SJames Wright PetscCall(VecDestroy(&Q)); 316149fb536SJames Wright PetscCall(VecDestroy(&user->Q_loc)); 317149fb536SJames Wright PetscCall(VecDestroy(&user->Q_dot_loc)); 318149fb536SJames Wright 319149fb536SJames Wright PetscCall(KSPDestroy(&user->mass_ksp)); 320149fb536SJames Wright 321149fb536SJames Wright // -- Matrices 322149fb536SJames Wright PetscCall(MatDestroy(&user->interp_viz)); 323149fb536SJames Wright PetscCall(MatDestroy(&user->mat_ijacobian)); 324149fb536SJames Wright 325149fb536SJames Wright // -- DM 326149fb536SJames Wright PetscCall(DMDestroy(&dm)); 327149fb536SJames Wright PetscCall(DMDestroy(&user->dm_viz)); 328149fb536SJames Wright 329149fb536SJames Wright // -- TS 330149fb536SJames Wright PetscCall(TSDestroy(&ts)); 331149fb536SJames Wright 332149fb536SJames Wright // -- Function list 333149fb536SJames Wright PetscCall(PetscFunctionListDestroy(&app_ctx->problems)); 334149fb536SJames Wright 335149fb536SJames Wright PetscCall(PetscFree(app_ctx->amat_type)); 336149fb536SJames Wright PetscCall(PetscFree(app_ctx->wall_forces.walls)); 337149fb536SJames Wright PetscCall(PetscViewerDestroy(&app_ctx->wall_forces.viewer)); 338149fb536SJames Wright 339149fb536SJames Wright // -- Structs 340149fb536SJames Wright for (PetscInt i = 0; i < problem->num_bc_defs; i++) { 341149fb536SJames Wright PetscCall(BCDefinitionDestroy(&problem->bc_defs[i])); 342149fb536SJames Wright } 343149fb536SJames Wright PetscCall(PetscFree(problem->bc_defs)); 344149fb536SJames Wright PetscCall(PetscFree(units)); 345149fb536SJames Wright PetscCall(PetscFree(user)); 346149fb536SJames Wright PetscCall(PetscFree(problem)); 347149fb536SJames Wright PetscCall(PetscFree(bc)); 348149fb536SJames Wright PetscCall(PetscFree(phys_ctx)); 349149fb536SJames Wright PetscCall(PetscFree(app_ctx)); 350149fb536SJames Wright PetscCall(PetscFree(ceed_data)); 351149fb536SJames Wright PetscCall(PetscFree(problem)); 352149fb536SJames Wright 353149fb536SJames Wright return PetscFinalize(); 354149fb536SJames Wright } 355