1ae2b091fSJames Wright // SPDX-FileCopyrightText: Copyright (c) 2017-2024, HONEE contributors. 2ae2b091fSJames Wright // SPDX-License-Identifier: Apache-2.0 OR BSD-2-Clause 3149fb536SJames Wright 4149fb536SJames Wright // libCEED + PETSc Example: Navier-Stokes 5149fb536SJames Wright // 6149fb536SJames Wright // This example demonstrates a simple usage of libCEED with PETSc to solve a Navier-Stokes problem. 7149fb536SJames Wright // 8149fb536SJames Wright // Build with: 9149fb536SJames Wright // 10149fb536SJames Wright // make [PETSC_DIR=</path/to/petsc>] [CEED_DIR=</path/to/libceed>] navierstokes 11149fb536SJames Wright // 12149fb536SJames Wright // Sample runs: 13149fb536SJames Wright // 14149fb536SJames Wright // ./navierstokes -ceed /cpu/self -options_file gaussianwave.yml 15149fb536SJames Wright // ./navierstokes -ceed /gpu/cuda -problem advection -degree 1 16149fb536SJames Wright // 17149fb536SJames Wright //TESTARGS(name="Newtonian and Riemann Solver Unit Tests",only="cpu") -ceed {ceed_resource} -test_type solver -options_file examples/gaussianwave.yaml -compare_final_state_atol 1e100 -compare_final_state_filename tests/output/fluids-navierstokes-gaussianwave-IDL-entropy.bin -dm_plex_box_faces 5,5,1 -ts_max_steps 0 -newtonian_unit_tests -riemann_solver_unit_tests 18149fb536SJames Wright //TESTARGS(name="Gaussian Wave, IDL and Entropy variables") -ceed {ceed_resource} -test_type solver -options_file examples/gaussianwave.yaml -compare_final_state_atol 2e-11 -compare_final_state_filename tests/output/fluids-navierstokes-gaussianwave-IDL-entropy.bin -state_var entropy -dm_plex_box_faces 5,5,1 -ts_max_steps 5 -idl_decay_time 2e-3 -idl_length 0.25 -idl_start 0 -idl_pressure 70 195ba826a2SJames Wright //TESTARGS(name="Blasius, SGS DataDriven Sequential Torch",only="torch") -ceed {ceed_resource} -options_file tests/blasius_stgtest.yaml -sgs_model_type data_driven -sgs_model_dd_leakyrelu_alpha 0.3 -sgs_model_dd_parameter_dir examples/dd_sgs_data -ts_dt 2e-9 -state_var primitive -ksp_rtol 1e-12 -snes_rtol 1e-12 -stg_mean_only -stg_fluctuating_IC -test_type solver -compare_final_state_atol 1e-10 -compare_final_state_filename tests/output/fluids-navierstokes-blasius-sgs-data-driven.bin -sgs_model_dd_implementation sequential_torch -sgs_model_dd_torch_model_path ./tests/createPyTorchModel/NNModel_HIT_fp64_jit.pt 205ba826a2SJames Wright //TESTARGS(name="Blasius, SGS DataDriven Sequential Ceed") -ceed {ceed_resource} -options_file tests/blasius_stgtest.yaml -sgs_model_type data_driven -sgs_model_dd_leakyrelu_alpha 0.3 -sgs_model_dd_parameter_dir examples/dd_sgs_data -ts_dt 2e-9 -state_var primitive -ksp_rtol 1e-12 -snes_rtol 1e-12 -stg_mean_only -stg_fluctuating_IC -test_type solver -compare_final_state_atol 1e-10 -compare_final_state_filename tests/output/fluids-navierstokes-blasius-sgs-data-driven.bin -sgs_model_dd_implementation sequential_ceed 21149fb536SJames Wright //TESTARGS(name="Gaussian Wave, explicit, supg, IDL") -ceed {ceed_resource} -test_type solver -options_file examples/gaussianwave.yaml -compare_final_state_atol 1e-8 -compare_final_state_filename tests/output/fluids-navierstokes-gaussianwave-explicit.bin -dm_plex_box_faces 2,2,1 -ts_max_steps 5 -degree 3 -implicit false -ts_type rk -stab supg -state_var conservative -mass_ksp_type gmres -mass_pc_jacobi_type diagonal -idl_decay_time 2e-3 -idl_length 0.25 -idl_start 0 -idl_pressure 70 22149fb536SJames Wright //TESTARGS(name="Advection 2D, rotation, explicit, supg, consistent mass") -ceed {ceed_resource} -test_type solver -problem advection -degree 3 -dm_plex_box_faces 2,2 -dm_plex_box_lower 0,0 -dm_plex_box_upper 125,125 -bc_wall 1,2,3,4 -wall_comps 4 -units_kilogram 1e-9 -rc 100. -ts_dt 1e-3 -ts_max_steps 10 -stab supg -Ctaus 0.5 -mass_ksp_type gmres -mass_pc_type vpbjacobi -compare_final_state_atol 1e-10 -compare_final_state_filename tests/output/fluids-navierstokes-adv2d-rotation-explicit-stab-supg-consistent-mass.bin 23149fb536SJames Wright //TESTARGS(name="Advection, skew") -ceed {ceed_resource} -test_type solver -options_file examples/advection.yaml -ts_max_steps 5 -wind_type translation -wind_translation -0.5547002,0.83205029,0 -advection_ic_type skew -dm_plex_box_faces 2,1,1 -degree 2 -stab supg -stab_tau advdiff_shakib -Ctau_a 4 -ksp_type gmres -diffusion_coeff 5e-4 -compare_final_state_atol 7e-10 -compare_final_state_filename tests/output/fluids-navierstokes-adv-skew.bin 24*8c85b835SJames Wright //TESTARGS(name="Blasius, bc_slip, Indirect Diffusive Flux Projection") -ceed {ceed_resource} -test_type solver -options_file examples/blasius.yaml -ts_max_steps 5 -dm_plex_box_faces 3,20,1 -platemesh_nDelta 10 -platemesh_growth 1.2 -bc_outflow 5 -bc_slip 4 -compare_final_state_atol 2E-11 -compare_final_state_filename tests/output/fluids-navierstokes-blasius-bc_slip_indirect.bin -div_diff_flux_projection_method indirect 25*8c85b835SJames Wright //TESTARGS(name="Blasius, bc_slip, Direct Diffusive Flux Projection") -ceed {ceed_resource} -test_type solver -options_file examples/blasius.yaml -ts_max_steps 5 -dm_plex_box_faces 3,20,1 -platemesh_nDelta 10 -platemesh_growth 1.2 -bc_outflow 5 -bc_slip 4 -compare_final_state_atol 2E-11 -compare_final_state_filename tests/output/fluids-navierstokes-blasius-bc_slip.bin -div_diff_flux_projection_method direct 26149fb536SJames Wright //TESTARGS(name="Advection, rotation, cosine") -ceed {ceed_resource} -test_type solver -options_file examples/advection.yaml -ts_max_steps 0 -advection_ic_type cosine_hill -dm_plex_box_faces 2,1,1 -compare_final_state_atol 1e-10 -compare_final_state_filename tests/output/fluids-navierstokes-adv-rotation-cosine.bin 27149fb536SJames Wright //TESTARGS(name="Gaussian Wave, using MatShell") -ceed {ceed_resource} -test_type solver -options_file examples/gaussianwave.yaml -compare_final_state_atol 1e-8 -compare_final_state_filename tests/output/fluids-navierstokes-gaussianwave-shell.bin -dm_plex_box_faces 2,2,1 -ts_max_steps 5 -degree 3 -amat_type shell -pc_type vpbjacobi -ts_alpha_radius 0.5 28149fb536SJames Wright //TESTARGS(name="Taylor-Green Vortex IC") -ceed {ceed_resource} -problem taylor_green -test_type solver -dm_plex_dim 3 -dm_plex_box_faces 6,6,6 -ts_max_steps 0 -compare_final_state_atol 1e-12 -compare_final_state_filename tests/output/fluids-navierstokes-taylor-green-IC.bin 295ba826a2SJames Wright //TESTARGS(name="Blasius, SGS DataDriven Fused") -ceed {ceed_resource} -options_file tests/blasius_stgtest.yaml -sgs_model_type data_driven -sgs_model_dd_leakyrelu_alpha 0.3 -sgs_model_dd_parameter_dir examples/dd_sgs_data -ts_dt 2e-9 -state_var primitive -ksp_rtol 1e-12 -snes_rtol 1e-12 -stg_mean_only -stg_fluctuating_IC -test_type solver -compare_final_state_atol 1e-10 -compare_final_state_filename tests/output/fluids-navierstokes-blasius-sgs-data-driven.bin 30149fb536SJames Wright //TESTARGS(name="Blasius, Anisotropic Differential Filter") -ceed {ceed_resource} -test_type diff_filter -options_file tests/blasius_test.yaml -compare_final_state_atol 5e-10 -compare_final_state_filename tests/output/fluids-navierstokes-blasius_diff_filter_aniso_vandriest.bin -diff_filter_monitor -ts_max_steps 0 -state_var primitive -diff_filter_friction_length 1e-5 -diff_filter_wall_damping_function van_driest -diff_filter_ksp_rtol 1e-8 -diff_filter_grid_based_width -diff_filter_width_scaling 1,0.7,1 31149fb536SJames Wright //TESTARGS(name="Blasius, Isotropic Differential Filter") -ceed {ceed_resource} -test_type diff_filter -options_file tests/blasius_test.yaml -compare_final_state_atol 2e-12 -compare_final_state_filename tests/output/fluids-navierstokes-blasius_diff_filter_iso.bin -diff_filter_monitor -ts_max_steps 0 -diff_filter_width_scaling 4.2e-5,4.2e-5,4.2e-5 -diff_filter_ksp_atol 1e-14 -diff_filter_ksp_rtol 1e-16 32149fb536SJames Wright //TESTARGS(name="Gaussian Wave, with IDL") -ceed {ceed_resource} -test_type solver -options_file examples/gaussianwave.yaml -compare_final_state_atol 2e-11 -compare_final_state_filename tests/output/fluids-navierstokes-gaussianwave-IDL.bin -dm_plex_box_faces 5,5,1 -ts_max_steps 5 -idl_decay_time 2e-3 -idl_length 0.25 -idl_start 0 -ts_alpha_radius 0.5 -idl_pressure 70 33149fb536SJames Wright //TESTARGS(name="Spanwise Turbulence Statistics") -ceed {ceed_resource} -test_type turb_spanstats -options_file tests/stats_test.yaml -compare_final_state_atol 1E-11 -compare_final_state_filename tests/output/fluids-navierstokes-turb-spanstats-stats.bin 34149fb536SJames Wright //TESTARGS(name="Blasius") -ceed {ceed_resource} -test_type solver -options_file tests/blasius_test.yaml -compare_final_state_atol 2E-11 -compare_final_state_filename tests/output/fluids-navierstokes-blasius.bin 35149fb536SJames Wright //TESTARGS(name="Blasius, STG Inflow") -ceed {ceed_resource} -test_type solver -options_file tests/blasius_stgtest.yaml -compare_final_state_atol 2E-11 -compare_final_state_filename tests/output/fluids-navierstokes-blasius_STG.bin 36149fb536SJames Wright //TESTARGS(name="Blasius, STG Inflow, Weak Temperature") -ceed {ceed_resource} -test_type solver -options_file tests/blasius_stgtest.yaml -compare_final_state_atol 1E-11 -compare_final_state_filename tests/output/fluids-navierstokes-blasius_STG_weakT.bin -weakT 37149fb536SJames Wright //TESTARGS(name="Blasius, Strong STG Inflow") -ceed {ceed_resource} -test_type solver -options_file tests/blasius_stgtest.yaml -compare_final_state_atol 1E-10 -compare_final_state_filename tests/output/fluids-navierstokes-blasius_STG_strongBC.bin -stg_strong true 38149fb536SJames Wright //TESTARGS(name="Channel") -ceed {ceed_resource} -test_type solver -options_file examples/channel.yaml -compare_final_state_atol 2e-11 -compare_final_state_filename tests/output/fluids-navierstokes-channel.bin -dm_plex_box_faces 5,5,1 -ts_max_steps 5 39149fb536SJames Wright //TESTARGS(name="Channel, Primitive") -ceed {ceed_resource} -test_type solver -options_file examples/channel.yaml -compare_final_state_atol 2e-11 -compare_final_state_filename tests/output/fluids-navierstokes-channel-prim.bin -dm_plex_box_faces 5,5,1 -ts_max_steps 5 -state_var primitive 40149fb536SJames Wright //TESTARGS(name="Density Current, explicit") -ceed {ceed_resource} -test_type solver -degree 3 -q_extra 2 -dm_plex_box_faces 1,1,2 -dm_plex_box_lower 0,0,0 -dm_plex_box_upper 125,125,250 -dm_plex_dim 3 -bc_symmetry_x 5,6 -bc_symmetry_y 3,4 -bc_symmetry_z 1,2 -units_kilogram 1e-9 -center 62.5,62.5,187.5 -rc 100. -thetaC -35. -mu 75 -gravity 0,0,-9.81 -ts_dt 1e-3 -units_meter 1e-2 -units_second 1e-2 -ts_max_steps 10 -compare_final_state_atol 1E-11 -compare_final_state_filename tests/output/fluids-navierstokes-dc-explicit.bin 41149fb536SJames Wright //TESTARGS(name="Density Current, implicit, no stabilization") -ceed {ceed_resource} -test_type solver -degree 3 -dm_plex_box_faces 1,1,2 -dm_plex_box_lower 0,0,0 -dm_plex_box_upper 125,125,250 -dm_plex_dim 3 -bc_symmetry_x 5,6 -bc_symmetry_y 3,4 -bc_symmetry_z 1,2 -units_kilogram 1e-9 -center 62.5,62.5,187.5 -rc 100. -thetaC -35. -mu 75 -gravity 0,0,-9.81 -units_meter 1e-2 -units_second 1e-2 -ksp_atol 1e-4 -ksp_rtol 1e-3 -ksp_type bcgs -snes_atol 1e-3 -snes_lag_jacobian 100 -snes_lag_jacobian_persists -snes_mf_operator -ts_dt 1e-3 -implicit -ts_type alpha -ts_max_steps 10 -compare_final_state_atol 5E-4 -compare_final_state_filename tests/output/fluids-navierstokes-dc-implicit-stab-none.bin 42149fb536SJames Wright //TESTARGS(name="Advection, rotation, implicit, SUPG stabilization") -ceed {ceed_resource} -test_type solver -problem advection -CtauS .3 -stab supg -degree 3 -dm_plex_box_faces 1,1,2 -dm_plex_box_lower 0,0,0 -dm_plex_box_upper 125,125,250 -dm_plex_dim 3 -bc_wall 1,2,3,4,5,6 -wall_comps 4 -units_kilogram 1e-9 -rc 100. -ksp_atol 1e-4 -ksp_rtol 1e-3 -ksp_type bcgs -snes_atol 1e-3 -snes_lag_jacobian 100 -snes_lag_jacobian_persists -snes_mf_operator -ts_dt 1e-3 -implicit -dm_mat_preallocate_skip 0 -ts_type alpha -compare_final_state_atol 5E-4 -ts_max_steps 10 -compare_final_state_filename tests/output/fluids-navierstokes-adv-rotation-implicit-stab-supg.bin 43149fb536SJames Wright //TESTARGS(name="Advection, translation, implicit, SU stabilization") -ceed {ceed_resource} -test_type solver -problem advection -CtauS .3 -stab su -degree 3 -dm_plex_box_faces 1,1,2 -dm_plex_box_lower 0,0,0 -dm_plex_box_upper 125,125,250 -dm_plex_dim 3 -units_kilogram 1e-9 -rc 100. -ksp_atol 1e-4 -ksp_rtol 1e-3 -ksp_type bcgs -snes_atol 1e-3 -snes_lag_jacobian 100 -snes_lag_jacobian_persists -snes_mf_operator -ts_dt 1e-3 -implicit -dm_mat_preallocate_skip 0 -ts_type alpha -wind_type translation -wind_translation .53,-1.33,-2.65 -bc_inflow 1,2,3,4,5,6 -ts_max_steps 10 -compare_final_state_atol 5E-4 -compare_final_state_filename tests/output/fluids-navierstokes-adv-translation-implicit-stab-su.bin 44149fb536SJames Wright //TESTARGS(name="Advection 2D, rotation, explicit, strong form") -ceed {ceed_resource} -test_type solver -problem advection -strong_form 1 -degree 3 -dm_plex_box_faces 2,2 -dm_plex_box_lower 0,0 -dm_plex_box_upper 125,125 -bc_wall 1,2,3,4 -wall_comps 4 -units_kilogram 1e-9 -rc 100. -ts_dt 1e-3 -compare_final_state_atol 5E-11 -ts_max_steps 10 -compare_final_state_filename tests/output/fluids-navierstokes-adv2d-rotation-explicit-strong.bin 45149fb536SJames Wright //TESTARGS(name="Advection 2D, rotation, implicit, SUPG stabilization") -ceed {ceed_resource} -test_type solver -problem advection -CtauS .3 -stab supg -degree 3 -dm_plex_box_faces 1,1,2 -dm_plex_box_lower 0,0 -dm_plex_box_upper 125,125 -bc_wall 1,2,3,4 -wall_comps 4 -units_kilogram 1e-9 -rc 100. -ksp_atol 1e-4 -ksp_rtol 1e-3 -ksp_type bcgs -snes_atol 1e-3 -snes_lag_jacobian 100 -snes_lag_jacobian_persists -snes_mf_operator -ts_dt 1e-3 -implicit -dm_mat_preallocate_skip 0 -ts_type alpha -ts_max_steps 10 -compare_final_state_atol 5E-4 -compare_final_state_filename tests/output/fluids-navierstokes-adv2d-rotation-implicit-stab-supg.bin 46149fb536SJames Wright //TESTARGS(name="Euler, implicit") -ceed {ceed_resource} -test_type solver -problem euler_vortex -degree 3 -dm_plex_box_faces 1,1,2 -dm_plex_box_lower 0,0,0 -dm_plex_box_upper 125,125,250 -dm_plex_dim 3 -units_meter 1e-4 -units_second 1e-4 -mean_velocity 1.4,-2.,0 -bc_inflow 4,6 -bc_outflow 3,5 -bc_symmetry_z 1,2 -vortex_strength 2 -ksp_atol 1e-4 -ksp_rtol 1e-3 -ksp_type bcgs -snes_atol 1e-3 -snes_lag_jacobian 100 -snes_lag_jacobian_persists -snes_mf_operator -ts_dt 1e-3 -implicit -dm_mat_preallocate_skip 0 -ts_type alpha -ts_max_steps 10 -compare_final_state_atol 5E-4 -compare_final_state_filename tests/output/fluids-navierstokes-euler-implicit.bin 47149fb536SJames Wright //TESTARGS(name="Euler, explicit") -ceed {ceed_resource} -test_type solver -problem euler_vortex -degree 3 -q_extra 2 -dm_plex_box_faces 2,2,1 -dm_plex_box_lower 0,0,0 -dm_plex_box_upper 125,125,250 -dm_plex_dim 3 -units_meter 1e-4 -units_second 1e-4 -mean_velocity 1.4,-2.,0 -bc_inflow 4,6 -bc_outflow 3,5 -bc_symmetry_z 1,2 -vortex_strength 2 -ts_dt 1e-7 -ts_rk_type 5bs -ts_rtol 1e-10 -ts_atol 1e-10 -ts_max_steps 10 -compare_final_state_atol 1E-7 -compare_final_state_filename tests/output/fluids-navierstokes-euler-explicit.bin 48149fb536SJames Wright //TESTARGS(name="Sod Shocktube, explicit, SU stabilization, y-z-beta shock capturing") -ceed {ceed_resource} -test_type solver -problem shocktube -degree 1 -q_extra 2 -dm_plex_box_faces 50,1,1 -units_meter 1e-2 units_second 1e-2 -dm_plex_box_lower 0,0,0 -dm_plex_box_upper 1000,20,20 -dm_plex_dim 3 -bc_symmetry_x 5,6 -bc_symmetry_y 3,4 -bc_symmetry_z 1,2 -yzb -stab su -ts_max_steps 10 -compare_final_state_atol 1E-11 -compare_final_state_filename tests/output/fluids-navierstokes-shocktube-explicit-su-yzb.bin 49149fb536SJames Wright 50149fb536SJames Wright /// @file 51149fb536SJames Wright /// Navier-Stokes example using PETSc 52149fb536SJames Wright 53149fb536SJames Wright const char help[] = "Solve Navier-Stokes using PETSc and libCEED\n"; 54149fb536SJames Wright 55149fb536SJames Wright #include <navierstokes.h> 56149fb536SJames Wright #include <petscdevice.h> 57149fb536SJames Wright 58149fb536SJames Wright #include <ceed.h> 59149fb536SJames Wright #include <petscdmplex.h> 60149fb536SJames Wright #include <petscts.h> 61149fb536SJames Wright 62149fb536SJames Wright int main(int argc, char **argv) { 63149fb536SJames Wright // --------------------------------------------------------------------------- 64149fb536SJames Wright // Initialize PETSc 65149fb536SJames Wright // --------------------------------------------------------------------------- 66149fb536SJames Wright PetscCall(PetscInitialize(&argc, &argv, NULL, help)); 67149fb536SJames Wright 68149fb536SJames Wright // --------------------------------------------------------------------------- 69149fb536SJames Wright // Create structs 70149fb536SJames Wright // --------------------------------------------------------------------------- 71149fb536SJames Wright AppCtx app_ctx; 72149fb536SJames Wright PetscCall(PetscCalloc1(1, &app_ctx)); 73149fb536SJames Wright 74149fb536SJames Wright ProblemData problem; 75149fb536SJames Wright PetscCall(PetscCalloc1(1, &problem)); 76149fb536SJames Wright 77149fb536SJames Wright User user; 78149fb536SJames Wright PetscCall(PetscCalloc1(1, &user)); 79149fb536SJames Wright 80149fb536SJames Wright CeedData ceed_data; 81149fb536SJames Wright PetscCall(PetscCalloc1(1, &ceed_data)); 82149fb536SJames Wright 83149fb536SJames Wright SimpleBC bc; 84149fb536SJames Wright PetscCall(PetscCalloc1(1, &bc)); 85149fb536SJames Wright 86149fb536SJames Wright Physics phys_ctx; 87149fb536SJames Wright PetscCall(PetscCalloc1(1, &phys_ctx)); 88149fb536SJames Wright 89149fb536SJames Wright Units units; 90149fb536SJames Wright PetscCall(PetscCalloc1(1, &units)); 91149fb536SJames Wright 92149fb536SJames Wright user->app_ctx = app_ctx; 93149fb536SJames Wright user->units = units; 94149fb536SJames Wright user->phys = phys_ctx; 95149fb536SJames Wright problem->set_bc_from_ics = PETSC_TRUE; 96149fb536SJames Wright 97149fb536SJames Wright PetscCall(RegisterLogEvents()); 98149fb536SJames Wright 99149fb536SJames Wright // --------------------------------------------------------------------------- 100149fb536SJames Wright // Process command line options 101149fb536SJames Wright // --------------------------------------------------------------------------- 102149fb536SJames Wright // -- Register problems to be available on the command line 103149fb536SJames Wright PetscCall(RegisterProblems_NS(app_ctx)); 104149fb536SJames Wright 105149fb536SJames Wright // -- Process general command line options 106149fb536SJames Wright MPI_Comm comm = PETSC_COMM_WORLD; 107149fb536SJames Wright user->comm = comm; 108149fb536SJames Wright PetscCall(ProcessCommandLineOptions(comm, app_ctx, bc)); 109149fb536SJames Wright PetscCall(BoundaryConditionSetUp(user, problem, app_ctx, bc)); 110149fb536SJames Wright 111149fb536SJames Wright // --------------------------------------------------------------------------- 112149fb536SJames Wright // Initialize libCEED 113149fb536SJames Wright // --------------------------------------------------------------------------- 114149fb536SJames Wright // -- Initialize backend 115149fb536SJames Wright Ceed ceed; 116149fb536SJames Wright PetscCheck(CeedInit(app_ctx->ceed_resource, &ceed) == CEED_ERROR_SUCCESS, comm, PETSC_ERR_LIB, "Ceed initialization failed"); 117149fb536SJames Wright user->ceed = ceed; 118149fb536SJames Wright 119149fb536SJames Wright PetscCheck(CeedSetErrorHandler(ceed, CeedErrorStore) == CEED_ERROR_SUCCESS, comm, PETSC_ERR_LIB, "Setting libCEED error handler failed"); 120149fb536SJames Wright 121149fb536SJames Wright // -- Check preferred MemType 122149fb536SJames Wright CeedMemType mem_type_backend; 123149fb536SJames Wright PetscCallCeed(ceed, CeedGetPreferredMemType(ceed, &mem_type_backend)); 124149fb536SJames Wright 125149fb536SJames Wright { 126149fb536SJames Wright const char *resource; 127149fb536SJames Wright PetscCallCeed(ceed, CeedGetResource(ceed, &resource)); 128149fb536SJames Wright if (strstr(resource, "/gpu/sycl")) { 129149fb536SJames Wright PetscDeviceContext dctx; 130149fb536SJames Wright PetscCall(PetscDeviceContextGetCurrentContext(&dctx)); 131149fb536SJames Wright void *stream_handle; 132149fb536SJames Wright PetscCall(PetscDeviceContextGetStreamHandle(dctx, &stream_handle)); 133149fb536SJames Wright PetscCallCeed(ceed, CeedSetStream(ceed, stream_handle)); 134149fb536SJames Wright } 135149fb536SJames Wright } 136149fb536SJames Wright 137149fb536SJames Wright // --------------------------------------------------------------------------- 138149fb536SJames Wright // Set up global mesh 139149fb536SJames Wright // --------------------------------------------------------------------------- 140149fb536SJames Wright // -- Create DM 141149fb536SJames Wright DM dm; 142149fb536SJames Wright VecType vec_type = NULL; 143149fb536SJames Wright MatType mat_type = NULL; 144149fb536SJames Wright switch (mem_type_backend) { 145149fb536SJames Wright case CEED_MEM_HOST: 146149fb536SJames Wright vec_type = VECSTANDARD; 147149fb536SJames Wright break; 148149fb536SJames Wright case CEED_MEM_DEVICE: { 149149fb536SJames Wright const char *resolved; 150149fb536SJames Wright PetscCallCeed(ceed, CeedGetResource(ceed, &resolved)); 151149fb536SJames Wright if (strstr(resolved, "/gpu/cuda")) vec_type = VECCUDA; 152149fb536SJames Wright else if (strstr(resolved, "/gpu/hip")) vec_type = VECKOKKOS; 153149fb536SJames Wright else if (strstr(resolved, "/gpu/sycl")) vec_type = VECKOKKOS; 154149fb536SJames Wright else vec_type = VECSTANDARD; 155149fb536SJames Wright } 156149fb536SJames Wright } 157149fb536SJames Wright if (strstr(vec_type, VECCUDA)) mat_type = MATAIJCUSPARSE; 158149fb536SJames Wright else if (strstr(vec_type, VECKOKKOS)) mat_type = MATAIJKOKKOS; 159149fb536SJames Wright else mat_type = MATAIJ; 160149fb536SJames Wright PetscCall(CreateDM(comm, problem, mat_type, vec_type, &dm)); 161149fb536SJames Wright user->dm = dm; 162149fb536SJames Wright PetscCall(DMSetApplicationContext(dm, user)); 163149fb536SJames Wright 164149fb536SJames Wright // --------------------------------------------------------------------------- 165149fb536SJames Wright // Choose the problem from the list of registered problems 166149fb536SJames Wright // --------------------------------------------------------------------------- 167149fb536SJames Wright { 168149fb536SJames Wright PetscErrorCode (*p)(ProblemData, DM, void *, SimpleBC); 169149fb536SJames Wright PetscCall(PetscFunctionListFind(app_ctx->problems, app_ctx->problem_name, &p)); 170149fb536SJames Wright PetscCheck(p, PETSC_COMM_SELF, 1, "Problem '%s' not found", app_ctx->problem_name); 171149fb536SJames Wright PetscCall((*p)(problem, dm, &user, bc)); 172149fb536SJames Wright } 173149fb536SJames Wright 174149fb536SJames Wright // -- Set up DM 175149fb536SJames Wright PetscCall(SetUpDM(dm, problem, app_ctx->degree, app_ctx->q_extra, bc, phys_ctx)); 176149fb536SJames Wright 177149fb536SJames Wright // -- Refine DM for high-order viz 178149fb536SJames Wright if (app_ctx->viz_refine) PetscCall(VizRefineDM(dm, user, problem, bc, phys_ctx)); 179149fb536SJames Wright 180149fb536SJames Wright // --------------------------------------------------------------------------- 181149fb536SJames Wright // Create solution vectors 182149fb536SJames Wright // --------------------------------------------------------------------------- 183149fb536SJames Wright // -- Set up global state vector Q 184149fb536SJames Wright Vec Q; 185149fb536SJames Wright PetscCall(DMCreateGlobalVector(dm, &Q)); 186149fb536SJames Wright PetscCall(VecZeroEntries(Q)); 187149fb536SJames Wright 188149fb536SJames Wright // -- Set up local state vectors Q_loc, Q_dot_loc 189149fb536SJames Wright PetscCall(DMCreateLocalVector(dm, &user->Q_loc)); 190149fb536SJames Wright PetscCall(DMCreateLocalVector(dm, &user->Q_dot_loc)); 191149fb536SJames Wright PetscCall(VecZeroEntries(user->Q_dot_loc)); 192149fb536SJames Wright 193149fb536SJames Wright // --------------------------------------------------------------------------- 194149fb536SJames Wright // Set up libCEED 195149fb536SJames Wright // --------------------------------------------------------------------------- 196149fb536SJames Wright // -- Set up libCEED objects 197149fb536SJames Wright PetscCall(SetupLibceed(ceed, ceed_data, dm, user, app_ctx, problem, bc)); 198149fb536SJames Wright 199149fb536SJames Wright // --------------------------------------------------------------------------- 200149fb536SJames Wright // Set up ICs 201149fb536SJames Wright // --------------------------------------------------------------------------- 202149fb536SJames Wright // -- Fix multiplicity for ICs 203149fb536SJames Wright PetscCall(ICs_FixMultiplicity(dm, ceed_data, user, user->Q_loc, Q, 0.0)); 204149fb536SJames Wright 205149fb536SJames Wright // --------------------------------------------------------------------------- 206149fb536SJames Wright // Record boundary values from initial condition 207149fb536SJames Wright // --------------------------------------------------------------------------- 208149fb536SJames Wright // -- This overrides DMPlexInsertBoundaryValues(). 209149fb536SJames Wright // We use this for the main simulation DM because the reference DMPlexInsertBoundaryValues() is very slow on the GPU due to extra device-to-host 210149fb536SJames Wright // communication. If we disable this, we should still get the same results due to the problem->bc function, but with potentially much slower 211149fb536SJames Wright // execution. 212149fb536SJames Wright if (problem->set_bc_from_ics) { 213149fb536SJames Wright PetscCall(SetBCsFromICs(dm, Q, user->Q_loc)); 214149fb536SJames Wright } 215149fb536SJames Wright 216149fb536SJames Wright // --------------------------------------------------------------------------- 217149fb536SJames Wright // Create output directory 218149fb536SJames Wright // --------------------------------------------------------------------------- 219149fb536SJames Wright PetscMPIInt rank; 220149fb536SJames Wright MPI_Comm_rank(comm, &rank); 221149fb536SJames Wright if (!rank) { 222149fb536SJames Wright PetscCall(PetscMkdir(app_ctx->output_dir)); 223149fb536SJames Wright } 224149fb536SJames Wright 225149fb536SJames Wright // --------------------------------------------------------------------------- 226149fb536SJames Wright // Gather initial Q values in case of continuation of simulation 227149fb536SJames Wright // --------------------------------------------------------------------------- 228149fb536SJames Wright // -- Set up initial values from binary file 229149fb536SJames Wright if (app_ctx->cont_steps) { 230db90dbaaSJames Wright PetscViewer viewer; 231db90dbaaSJames Wright 232db90dbaaSJames Wright PetscCall(PetscViewerBinaryOpen(comm, app_ctx->cont_file, FILE_MODE_READ, &viewer)); 233db90dbaaSJames Wright PetscCall(HoneeLoadBinaryVec(viewer, Q, &app_ctx->cont_time, &app_ctx->cont_steps)); 234db90dbaaSJames Wright PetscCall(PetscViewerDestroy(&viewer)); 235149fb536SJames Wright } 236149fb536SJames Wright 237149fb536SJames Wright // -- Zero Q_loc 238149fb536SJames Wright PetscCall(VecZeroEntries(user->Q_loc)); 239149fb536SJames Wright 240149fb536SJames Wright // --------------------------------------------------------------------------- 241149fb536SJames Wright // TS: Create, setup, and solve 242149fb536SJames Wright // --------------------------------------------------------------------------- 243149fb536SJames Wright TS ts; 244149fb536SJames Wright PetscScalar final_time; 245149fb536SJames Wright PetscCall(TSSolve_NS(dm, user, app_ctx, phys_ctx, problem, &Q, &final_time, &ts)); 246149fb536SJames Wright 247149fb536SJames Wright // --------------------------------------------------------------------------- 248149fb536SJames Wright // Post-processing 249149fb536SJames Wright // --------------------------------------------------------------------------- 250149fb536SJames Wright PetscCall(PostProcess(ts, ceed_data, dm, problem, user, Q, final_time)); 251149fb536SJames Wright 252149fb536SJames Wright // --------------------------------------------------------------------------- 253149fb536SJames Wright // Destroy libCEED objects 254149fb536SJames Wright // --------------------------------------------------------------------------- 255149fb536SJames Wright 256149fb536SJames Wright PetscCall(TurbulenceStatisticsDestroy(user, ceed_data)); 257149fb536SJames Wright PetscCall(NodalProjectionDataDestroy(user->grad_velo_proj)); 258149fb536SJames Wright PetscCall(SgsDDDataDestroy(user->sgs_dd_data)); 259149fb536SJames Wright PetscCall(DifferentialFilterDataDestroy(user->diff_filter)); 260149fb536SJames Wright PetscCall(SGS_DD_TrainingDataDestroy(user->sgs_dd_train)); 261149fb536SJames Wright PetscCall(SmartSimDataDestroy(user->smartsim)); 262e816a7e4SJames Wright PetscCall(QDataClearStoredData()); 263*8c85b835SJames Wright PetscCall(DivDiffFluxProjectionDataDestroy(user->diff_flux_proj)); 264149fb536SJames Wright 265149fb536SJames Wright // -- Vectors 266149fb536SJames Wright PetscCallCeed(ceed, CeedVectorDestroy(&ceed_data->x_coord)); 267149fb536SJames Wright PetscCallCeed(ceed, CeedVectorDestroy(&user->q_ceed)); 268149fb536SJames Wright PetscCallCeed(ceed, CeedVectorDestroy(&user->q_dot_ceed)); 269149fb536SJames Wright PetscCallCeed(ceed, CeedVectorDestroy(&user->g_ceed)); 270149fb536SJames Wright 271149fb536SJames Wright // -- Bases 272149fb536SJames Wright PetscCallCeed(ceed, CeedBasisDestroy(&ceed_data->basis_q)); 273149fb536SJames Wright PetscCallCeed(ceed, CeedBasisDestroy(&ceed_data->basis_x)); 274149fb536SJames Wright 275149fb536SJames Wright // -- Restrictions 276149fb536SJames Wright PetscCallCeed(ceed, CeedElemRestrictionDestroy(&ceed_data->elem_restr_q)); 277149fb536SJames Wright PetscCallCeed(ceed, CeedElemRestrictionDestroy(&ceed_data->elem_restr_x)); 278149fb536SJames Wright 279149fb536SJames Wright // Destroy QFunction contexts after using 280149fb536SJames Wright // ToDo: Simplify tracked libCEED objects, smaller struct 281149fb536SJames Wright { 282e07531f7SJames Wright PetscCallCeed(ceed, CeedQFunctionContextDestroy(&problem->apply_inflow.qfctx)); 283e07531f7SJames Wright PetscCallCeed(ceed, CeedQFunctionContextDestroy(&problem->apply_inflow_jacobian.qfctx)); 284e07531f7SJames Wright PetscCallCeed(ceed, CeedQFunctionContextDestroy(&problem->apply_outflow.qfctx)); 285e07531f7SJames Wright PetscCallCeed(ceed, CeedQFunctionContextDestroy(&problem->apply_outflow_jacobian.qfctx)); 286e07531f7SJames Wright PetscCallCeed(ceed, CeedQFunctionContextDestroy(&problem->apply_freestream.qfctx)); 287e07531f7SJames Wright PetscCallCeed(ceed, CeedQFunctionContextDestroy(&problem->apply_freestream_jacobian.qfctx)); 288e07531f7SJames Wright PetscCallCeed(ceed, CeedQFunctionContextDestroy(&problem->apply_slip.qfctx)); 289e07531f7SJames Wright PetscCallCeed(ceed, CeedQFunctionContextDestroy(&problem->apply_slip_jacobian.qfctx)); 290e07531f7SJames Wright PetscCallCeed(ceed, CeedQFunctionContextDestroy(&problem->ics.qfctx)); 291e07531f7SJames Wright PetscCallCeed(ceed, CeedQFunctionContextDestroy(&problem->apply_vol_rhs.qfctx)); 292e07531f7SJames Wright PetscCallCeed(ceed, CeedQFunctionContextDestroy(&problem->apply_vol_ifunction.qfctx)); 293e07531f7SJames Wright PetscCallCeed(ceed, CeedQFunctionContextDestroy(&problem->apply_vol_ijacobian.qfctx)); 294149fb536SJames Wright } 295149fb536SJames Wright 296149fb536SJames Wright // -- Operators 297149fb536SJames Wright PetscCall(OperatorApplyContextDestroy(ceed_data->op_ics_ctx)); 298149fb536SJames Wright PetscCall(OperatorApplyContextDestroy(user->op_rhs_ctx)); 299149fb536SJames Wright PetscCall(OperatorApplyContextDestroy(user->op_strong_bc_ctx)); 300149fb536SJames Wright PetscCallCeed(ceed, CeedOperatorDestroy(&user->op_ifunction)); 301149fb536SJames Wright 302149fb536SJames Wright // -- Ceed 303149fb536SJames Wright PetscCheck(CeedDestroy(&ceed) == CEED_ERROR_SUCCESS, comm, PETSC_ERR_LIB, "Destroying Ceed object failed"); 304149fb536SJames Wright 305149fb536SJames Wright if (app_ctx->test_type != TESTTYPE_NONE) { 306149fb536SJames Wright PetscInt num_options_left = 0; 307149fb536SJames Wright PetscCall(PetscOptionsLeftGet(NULL, &num_options_left, NULL, NULL)); 308149fb536SJames Wright PetscCheck(num_options_left == 0, PETSC_COMM_WORLD, -1, 309149fb536SJames Wright "There are unused options. This is not allowed. See error message for the unused options (or use -options_left directly)"); 310149fb536SJames Wright } 311149fb536SJames Wright 312149fb536SJames Wright // --------------------------------------------------------------------------- 313149fb536SJames Wright // Clean up PETSc 314149fb536SJames Wright // --------------------------------------------------------------------------- 315149fb536SJames Wright // -- Vectors 316149fb536SJames Wright PetscCall(VecDestroy(&Q)); 317149fb536SJames Wright PetscCall(VecDestroy(&user->Q_loc)); 318149fb536SJames Wright PetscCall(VecDestroy(&user->Q_dot_loc)); 319149fb536SJames Wright 320149fb536SJames Wright PetscCall(KSPDestroy(&user->mass_ksp)); 321149fb536SJames Wright 322149fb536SJames Wright // -- Matrices 323149fb536SJames Wright PetscCall(MatDestroy(&user->interp_viz)); 324149fb536SJames Wright PetscCall(MatDestroy(&user->mat_ijacobian)); 325149fb536SJames Wright 326149fb536SJames Wright // -- DM 327149fb536SJames Wright PetscCall(DMDestroy(&dm)); 328149fb536SJames Wright PetscCall(DMDestroy(&user->dm_viz)); 329149fb536SJames Wright 330149fb536SJames Wright // -- TS 331149fb536SJames Wright PetscCall(TSDestroy(&ts)); 332149fb536SJames Wright 333149fb536SJames Wright // -- Function list 334149fb536SJames Wright PetscCall(PetscFunctionListDestroy(&app_ctx->problems)); 335149fb536SJames Wright 336149fb536SJames Wright PetscCall(PetscFree(app_ctx->amat_type)); 337149fb536SJames Wright PetscCall(PetscFree(app_ctx->wall_forces.walls)); 338a29281c9SJames Wright PetscCall(PetscViewerDestroy(&app_ctx->wall_forces.viewer)); 339a29281c9SJames Wright PetscCall(PetscViewerDestroy(&app_ctx->turb_spanstats_viewer)); 340149fb536SJames Wright 341149fb536SJames Wright // -- Structs 342149fb536SJames Wright for (PetscInt i = 0; i < problem->num_bc_defs; i++) { 343149fb536SJames Wright PetscCall(BCDefinitionDestroy(&problem->bc_defs[i])); 344149fb536SJames Wright } 345149fb536SJames Wright PetscCall(PetscFree(problem->bc_defs)); 346149fb536SJames Wright PetscCall(PetscFree(units)); 347149fb536SJames Wright PetscCall(PetscFree(user)); 348149fb536SJames Wright PetscCall(PetscFree(problem)); 349149fb536SJames Wright PetscCall(PetscFree(bc)); 350149fb536SJames Wright PetscCall(PetscFree(phys_ctx)); 351149fb536SJames Wright PetscCall(PetscFree(app_ctx)); 352149fb536SJames Wright PetscCall(PetscFree(ceed_data)); 353149fb536SJames Wright PetscCall(PetscFree(problem)); 354149fb536SJames Wright 355149fb536SJames Wright return PetscFinalize(); 356149fb536SJames Wright } 357