From 2655f96894742a0398ceb591b1e990b425d9adf5 Mon Sep 17 00:00:00 2001 From: Ann Almgren Date: Wed, 4 Dec 2024 19:08:02 -0800 Subject: [PATCH] use generalized bc's for FFT preconditioner (#1986) * use generalized bc's for FFT preconditioner * update amrex * use new interface to PoissonHybrid * ignore unused * inline function * update to FFT stuff * fix order of members * FFT-preconditioned GMRES now works on actual terrain! * remove WitchOfAgnesi_JAMES --- CMakeLists.txt | 2 +- .../WitchOfAgnesi_JAMES/CMakeLists.txt | 15 - .../WitchOfAgnesi_JAMES/ERF_prob.H | 63 ----- .../WitchOfAgnesi_JAMES/ERF_prob.cpp | 163 ----------- .../WitchOfAgnesi_JAMES/GNUmakefile | 33 --- .../WitchOfAgnesi_JAMES/Make.package | 2 - Exec/DryRegTests/WitchOfAgnesi_JAMES/README | 6 - .../WitchOfAgnesi_JAMES/input_sounding | 202 -------------- Exec/DryRegTests/WitchOfAgnesi_JAMES/inputs | 76 ----- Source/ERF.H | 7 +- Source/LinearSolvers/ERF_FFT_TerrainPrecond.H | 262 ------------------ Source/LinearSolvers/ERF_FFT_Utils.H | 73 +++++ Source/LinearSolvers/ERF_PoissonSolve.cpp | 11 +- Source/LinearSolvers/ERF_TerrainPoisson.H | 11 +- Source/LinearSolvers/ERF_TerrainPoisson.cpp | 85 ++++-- Source/LinearSolvers/ERF_solve_with_fft.cpp | 76 +---- Source/LinearSolvers/ERF_solve_with_gmres.cpp | 8 +- Source/LinearSolvers/Make.package | 4 +- 18 files changed, 178 insertions(+), 921 deletions(-) delete mode 100644 Exec/DryRegTests/WitchOfAgnesi_JAMES/CMakeLists.txt delete mode 100644 Exec/DryRegTests/WitchOfAgnesi_JAMES/ERF_prob.H delete mode 100644 Exec/DryRegTests/WitchOfAgnesi_JAMES/ERF_prob.cpp delete mode 100644 Exec/DryRegTests/WitchOfAgnesi_JAMES/GNUmakefile delete mode 100644 Exec/DryRegTests/WitchOfAgnesi_JAMES/Make.package delete mode 100644 Exec/DryRegTests/WitchOfAgnesi_JAMES/README delete mode 100644 Exec/DryRegTests/WitchOfAgnesi_JAMES/input_sounding delete mode 100644 Exec/DryRegTests/WitchOfAgnesi_JAMES/inputs delete mode 100644 Source/LinearSolvers/ERF_FFT_TerrainPrecond.H create mode 100644 Source/LinearSolvers/ERF_FFT_Utils.H diff --git a/CMakeLists.txt b/CMakeLists.txt index 515237115..b3f999462 100644 --- a/CMakeLists.txt +++ b/CMakeLists.txt @@ -245,7 +245,7 @@ target_link_libraries(erf_api PUBLIC erf_srclib) add_library(${PROJECT_NAME}::erf_api ALIAS erf_srclib) # Collect all headers and make them installable with the target -set(ERF_INCLUDES "Source/ERF.H;Source/ERF_Constants.H;Source/WindFarmParametrization/SimpleActuatorDisk/ERF_SimpleAD.H;Source/WindFarmParametrization/EWP/ERF_EWP.H;Source/WindFarmParametrization/Null/ERF_NullWindFarm.H;Source/WindFarmParametrization/ERF_WindFarm.H;Source/WindFarmParametrization/Fitch/ERF_Fitch.H;Source/BoundaryConditions/ERF_PhysBCFunct.H;Source/BoundaryConditions/ERF_MOSTAverage.H;Source/BoundaryConditions/ERF_MOSTRoughness.H;Source/BoundaryConditions/ERF_ABLMost.H;Source/BoundaryConditions/ERF_FillPatcher.H;Source/BoundaryConditions/ERF_MOSTStress.H;Source/BoundaryConditions/ERF_TimeInterpolatedData.H;Source/Utils/ERF_Interpolation.H;Source/Utils/ERF_TileNoZ.H;Source/Utils/ERF_PlaneAverage.H;Source/Utils/ERF_Interpolation_WENO.H;Source/Utils/ERF_DirectionSelector.H;Source/Utils/ERF_ParFunctions.H;Source/Utils/ERF_Wstar.H;Source/Utils/ERF_Microphysics_Utils.H;Source/Utils/ERF_Sat_methods.H;Source/Utils/ERF_Interpolation_1D.H;Source/Utils/ERF_Interpolation_UPW.H;Source/Utils/ERF_TerrainMetrics.H;Source/Utils/ERF_Interpolation_WENO_Z.H;Source/Utils/ERF_Thetav.H;Source/Utils/ERF_Water_vapor_saturation.H;Source/Utils/ERF_Utils.H;Source/Utils/ERF_Orbit.H;Source/Utils/ERF_EOS.H;Source/Utils/ERF_HSE_utils.H;Source/EB/ERF_TerrainIF.H;Source/EB/ERF_FlowerIF.H;Source/EB/ERF_eb_if.H;Source/Particles/ERFPC.H;Source/Particles/ERF_ParticleData.H;Source/Prob/ERF_init_density_hse_dry.H;Source/Prob/ERF_init_rayleigh_damping.H;Source/Prob/ERF_init_constant_density_hse.H;Source/ERF_prob_common.H;Source/ERF_Derive.H;Source/Radiation/ERF_Mam4_constituents.H;Source/Radiation/ERF_Mam4_aero.H;Source/Radiation/ERF_Optics.H;Source/Radiation/ERF_Modal_aero_wateruptake.H;Source/Radiation/ERF_Cloud_rad_props.H;Source/Radiation/ERF_Phys_prop.H;Source/Radiation/ERF_Radiation.H;Source/Radiation/ERF_Albedo.H;Source/Radiation/ERF_Parameterizations.H;Source/Radiation/ERF_Rad_constants.H;Source/Radiation/ERF_Aero_rad_props.H;Source/Radiation/ERF_m2005_effradius.H;Source/Radiation/ERF_Linear_interpolate.H;Source/Radiation/ERF_Slingo.H;Source/Radiation/ERF_Rrtmgp.H;Source/Radiation/ERF_Ebert_curry.H;Source/SourceTerms/ERF_NumericalDiffusion.H;Source/SourceTerms/ERF_Src_headers.H;Source/IO/ERF_SampleData.H;Source/IO/ERF_NCInterface.H;Source/IO/ERF_NCWpsFile.H;Source/IO/ERF_NCPlotFile.H;Source/IO/ERF_ReadBndryPlanes.H;Source/IO/ERF_WriteBndryPlanes.H;Source/PBL/ERF_MYNNStruct.H;Source/PBL/ERF_PBLModels.H;Source/PBL/ERF_PBLHeight.H;Source/TimeIntegration/ERF_TI_substep_fun.H;Source/TimeIntegration/ERF_TI_slow_headers.H;Source/TimeIntegration/ERF_TI_slow_rhs_fun.H;Source/TimeIntegration/ERF_TI_fast_headers.H;Source/TimeIntegration/ERF_TI_utils.H;Source/TimeIntegration/ERF_MRI.H;Source/TimeIntegration/ERF_TI_no_substep_fun.H;Source/LandSurfaceModel/Null/ERF_NullSurf.H;Source/LandSurfaceModel/ERF_LandSurface.H;Source/LandSurfaceModel/MM5/ERF_MM5.H;Source/LandSurfaceModel/SLM/ERF_SLM.H;Source/ERF_IndexDefines.H;Source/Advection/ERF_AdvectionSrcForMom_N.H;Source/Advection/ERF_AdvectionSrcForScalars.H;Source/Advection/ERF_AdvectionSrcForMom_T.H;Source/Advection/ERF_Advection.H;Source/MultiBlock/ERF_MultiBlockContainer.H;Source/Initialization/ERF_Metgrid_utils.H;Source/Diffusion/ERF_EddyViscosity.H;Source/Diffusion/ERF_Diffusion.H;Source/Microphysics/Null/ERF_NullMoistLagrangian.H;Source/Microphysics/Null/ERF_NullMoist.H;Source/Microphysics/ERF_Microphysics.H;Source/Microphysics/ERF_LagrangianMicrophysics.H;Source/Microphysics/ERF_EulerianMicrophysics.H;Source/Microphysics/Kessler/ERF_Kessler.H;Source/Microphysics/SAM/ERF_SAM.H;Source/DataStructs/ERF_InputSpongeData.H;Source/DataStructs/ERF_TurbPertStruct.H;Source/DataStructs/ERF_SpongeStruct.H;Source/DataStructs/ERF_AdvStruct.H;Source/DataStructs/ERF_DataStruct.H;Source/DataStructs/ERF_InputSoundingData.H;Source/DataStructs/ERF_DiffStruct.H;Source/DataStructs/ERF_TurbStruct.H ERF_TerrainPoisson.H ERF_FFT_TerrainPrecond.H") +set(ERF_INCLUDES "Source/ERF.H;Source/ERF_Constants.H;Source/WindFarmParametrization/SimpleActuatorDisk/ERF_SimpleAD.H;Source/WindFarmParametrization/EWP/ERF_EWP.H;Source/WindFarmParametrization/Null/ERF_NullWindFarm.H;Source/WindFarmParametrization/ERF_WindFarm.H;Source/WindFarmParametrization/Fitch/ERF_Fitch.H;Source/BoundaryConditions/ERF_PhysBCFunct.H;Source/BoundaryConditions/ERF_MOSTAverage.H;Source/BoundaryConditions/ERF_MOSTRoughness.H;Source/BoundaryConditions/ERF_ABLMost.H;Source/BoundaryConditions/ERF_FillPatcher.H;Source/BoundaryConditions/ERF_MOSTStress.H;Source/BoundaryConditions/ERF_TimeInterpolatedData.H;Source/Utils/ERF_Interpolation.H;Source/Utils/ERF_TileNoZ.H;Source/Utils/ERF_PlaneAverage.H;Source/Utils/ERF_Interpolation_WENO.H;Source/Utils/ERF_DirectionSelector.H;Source/Utils/ERF_ParFunctions.H;Source/Utils/ERF_Wstar.H;Source/Utils/ERF_Microphysics_Utils.H;Source/Utils/ERF_Sat_methods.H;Source/Utils/ERF_Interpolation_1D.H;Source/Utils/ERF_Interpolation_UPW.H;Source/Utils/ERF_TerrainMetrics.H;Source/Utils/ERF_Interpolation_WENO_Z.H;Source/Utils/ERF_Thetav.H;Source/Utils/ERF_Water_vapor_saturation.H;Source/Utils/ERF_Utils.H;Source/Utils/ERF_Orbit.H;Source/Utils/ERF_EOS.H;Source/Utils/ERF_HSE_utils.H;Source/EB/ERF_TerrainIF.H;Source/EB/ERF_FlowerIF.H;Source/EB/ERF_eb_if.H;Source/Particles/ERFPC.H;Source/Particles/ERF_ParticleData.H;Source/Prob/ERF_init_density_hse_dry.H;Source/Prob/ERF_init_rayleigh_damping.H;Source/Prob/ERF_init_constant_density_hse.H;Source/ERF_prob_common.H;Source/ERF_Derive.H;Source/Radiation/ERF_Mam4_constituents.H;Source/Radiation/ERF_Mam4_aero.H;Source/Radiation/ERF_Optics.H;Source/Radiation/ERF_Modal_aero_wateruptake.H;Source/Radiation/ERF_Cloud_rad_props.H;Source/Radiation/ERF_Phys_prop.H;Source/Radiation/ERF_Radiation.H;Source/Radiation/ERF_Albedo.H;Source/Radiation/ERF_Parameterizations.H;Source/Radiation/ERF_Rad_constants.H;Source/Radiation/ERF_Aero_rad_props.H;Source/Radiation/ERF_m2005_effradius.H;Source/Radiation/ERF_Linear_interpolate.H;Source/Radiation/ERF_Slingo.H;Source/Radiation/ERF_Rrtmgp.H;Source/Radiation/ERF_Ebert_curry.H;Source/SourceTerms/ERF_NumericalDiffusion.H;Source/SourceTerms/ERF_Src_headers.H;Source/IO/ERF_SampleData.H;Source/IO/ERF_NCInterface.H;Source/IO/ERF_NCWpsFile.H;Source/IO/ERF_NCPlotFile.H;Source/IO/ERF_ReadBndryPlanes.H;Source/IO/ERF_WriteBndryPlanes.H;Source/PBL/ERF_MYNNStruct.H;Source/PBL/ERF_PBLModels.H;Source/PBL/ERF_PBLHeight.H;Source/TimeIntegration/ERF_TI_substep_fun.H;Source/TimeIntegration/ERF_TI_slow_headers.H;Source/TimeIntegration/ERF_TI_slow_rhs_fun.H;Source/TimeIntegration/ERF_TI_fast_headers.H;Source/TimeIntegration/ERF_TI_utils.H;Source/TimeIntegration/ERF_MRI.H;Source/TimeIntegration/ERF_TI_no_substep_fun.H;Source/LandSurfaceModel/Null/ERF_NullSurf.H;Source/LandSurfaceModel/ERF_LandSurface.H;Source/LandSurfaceModel/MM5/ERF_MM5.H;Source/LandSurfaceModel/SLM/ERF_SLM.H;Source/ERF_IndexDefines.H;Source/Advection/ERF_AdvectionSrcForMom_N.H;Source/Advection/ERF_AdvectionSrcForScalars.H;Source/Advection/ERF_AdvectionSrcForMom_T.H;Source/Advection/ERF_Advection.H;Source/MultiBlock/ERF_MultiBlockContainer.H;Source/Initialization/ERF_Metgrid_utils.H;Source/Diffusion/ERF_EddyViscosity.H;Source/Diffusion/ERF_Diffusion.H;Source/Microphysics/Null/ERF_NullMoistLagrangian.H;Source/Microphysics/Null/ERF_NullMoist.H;Source/Microphysics/ERF_Microphysics.H;Source/Microphysics/ERF_LagrangianMicrophysics.H;Source/Microphysics/ERF_EulerianMicrophysics.H;Source/Microphysics/Kessler/ERF_Kessler.H;Source/Microphysics/SAM/ERF_SAM.H;Source/DataStructs/ERF_InputSpongeData.H;Source/DataStructs/ERF_TurbPertStruct.H;Source/DataStructs/ERF_SpongeStruct.H;Source/DataStructs/ERF_AdvStruct.H;Source/DataStructs/ERF_DataStruct.H;Source/DataStructs/ERF_InputSoundingData.H;Source/DataStructs/ERF_DiffStruct.H;Source/DataStructs/ERF_TurbStruct.H ERF_TerrainPoisson.H ERF_FFT_Utils.H") set_target_properties( erf_srclib PROPERTIES PUBLIC_HEADER "${ERF_INCLUDES}") diff --git a/Exec/DryRegTests/WitchOfAgnesi_JAMES/CMakeLists.txt b/Exec/DryRegTests/WitchOfAgnesi_JAMES/CMakeLists.txt deleted file mode 100644 index 1b0c8295f..000000000 --- a/Exec/DryRegTests/WitchOfAgnesi_JAMES/CMakeLists.txt +++ /dev/null @@ -1,15 +0,0 @@ -set(erf_exe_name erf_witch_of_agnesi) - -add_executable(${erf_exe_name} "") -target_sources(${erf_exe_name} - PRIVATE - ERF_prob.cpp -) - -target_include_directories(${erf_exe_name} PRIVATE ${CMAKE_CURRENT_SOURCE_DIR}) - -include(${CMAKE_SOURCE_DIR}/CMake/BuildERFExe.cmake) -build_erf_exe(${erf_exe_name}) - -#find_package(AMReX) -#target_link_libraries( ${_target} AMReX::amrex) diff --git a/Exec/DryRegTests/WitchOfAgnesi_JAMES/ERF_prob.H b/Exec/DryRegTests/WitchOfAgnesi_JAMES/ERF_prob.H deleted file mode 100644 index e8d701b3b..000000000 --- a/Exec/DryRegTests/WitchOfAgnesi_JAMES/ERF_prob.H +++ /dev/null @@ -1,63 +0,0 @@ -#ifndef ERF_PROB_H_ -#define ERF_PROB_H_ - -#include - -#include "AMReX_REAL.H" - -#include "ERF_prob_common.H" - -struct ProbParm : ProbParmDefaults { - // perturbations to initial conditions - amrex::Real rho_0 = 0.0; - amrex::Real T_0 = 0.0; - amrex::Real U_0 = 0.0; - amrex::Real V_0 = 0.0; - amrex::Real W_0 = 0.0; // needed for rayleigh damping - - // hill parameters - amrex::Real hmax = 0.0; // full hill height, can be negative to simulate valleys - amrex::Real L = 0.0; // hill length at half-height -}; // namespace ProbParm - -class Problem : public ProblemBase -{ -public: - Problem(); - -#include "Prob/ERF_init_density_hse_dry.H" -#include "Prob/ERF_init_rayleigh_damping.H" - - void init_custom_pert ( - const amrex::Box& bx, - const amrex::Box& xbx, - const amrex::Box& ybx, - const amrex::Box& zbx, - amrex::Array4 const& state, - amrex::Array4 const& state_pert, - amrex::Array4 const& x_vel_pert, - amrex::Array4 const& y_vel_pert, - amrex::Array4 const& z_vel_pert, - amrex::Array4 const& r_hse, - amrex::Array4 const& p_hse, - amrex::Array4 const& z_nd, - amrex::Array4 const& z_cc, - amrex::GeometryData const& geomdata, - amrex::Array4 const& mf_m, - amrex::Array4 const& mf_u, - amrex::Array4 const& mf_v, - const SolverChoice& sc) override; - - void init_custom_terrain ( - const amrex::Geometry& geom, - amrex::MultiFab& z_phys_nd, - const amrex::Real& time) override; - -protected: - std::string name() override { return "Witch of Agnesi Hill"; } - -private: - ProbParm parms; -}; - -#endif diff --git a/Exec/DryRegTests/WitchOfAgnesi_JAMES/ERF_prob.cpp b/Exec/DryRegTests/WitchOfAgnesi_JAMES/ERF_prob.cpp deleted file mode 100644 index d30a98cc7..000000000 --- a/Exec/DryRegTests/WitchOfAgnesi_JAMES/ERF_prob.cpp +++ /dev/null @@ -1,163 +0,0 @@ -#include "ERF_prob.H" -#include "ERF_TerrainMetrics.H" - -using namespace amrex; - -std::unique_ptr -amrex_probinit ( - const amrex_real* /*problo*/, - const amrex_real* /*probhi*/) -{ - return std::make_unique(); -} - -Problem::Problem () -{ - // Parse params - ParmParse pp("prob"); - pp.query("rho_0", parms.rho_0); - pp.query("T_0", parms.T_0); - pp.query("U_0", parms.U_0); - pp.query("V_0", parms.V_0); - pp.query("W_0", parms.W_0); - - pp.query("hmax", parms.hmax); - pp.query("L", parms.L); - - init_base_parms(parms.rho_0, parms.T_0); -} - -void -Problem::init_custom_pert ( - const Box& bx, - const Box& xbx, - const Box& ybx, - const Box& zbx, - Array4 const& /*state*/, - Array4 const& state_pert, - Array4 const& x_vel_pert, - Array4 const& y_vel_pert, - Array4 const& z_vel_pert, - Array4 const& /*r_hse*/, - Array4 const& /*p_hse*/, - Array4 const& z_nd, - Array4 const& /*z_cc*/, - GeometryData const& geomdata, - Array4 const& /*mf_m*/, - Array4 const& /*mf_u*/, - Array4 const& /*mf_v*/, - const SolverChoice& sc) -{ - const bool use_moisture = (sc.moisture_type != MoistureType::None); - - ParallelFor(bx, [=] AMREX_GPU_DEVICE(int i, int j, int k) noexcept - { - // Set scalar = 0 everywhere - state_pert(i, j, k, RhoScalar_comp) = 0.0; - - if (use_moisture) { - state_pert(i, j, k, RhoQ1_comp) = 0.0; - state_pert(i, j, k, RhoQ2_comp) = 0.0; - } - }); - - // Set the x-velocity - ParallelFor(xbx, [=, parms_d=parms] AMREX_GPU_DEVICE(int i, int j, int k) noexcept - { - x_vel_pert(i, j, k) = parms_d.U_0; - }); - - // Set the y-velocity - ParallelFor(ybx, [=] AMREX_GPU_DEVICE(int i, int j, int k) noexcept - { - y_vel_pert(i, j, k) = 0.0; - }); - - const auto dx = geomdata.CellSize(); - amrex::GpuArray dxInv; - dxInv[0] = 1. / dx[0]; - dxInv[1] = 1. / dx[1]; - dxInv[2] = 1. / dx[2]; - - // Set the z-velocity from impenetrable condition - ParallelFor(zbx, [=] AMREX_GPU_DEVICE(int i, int j, int k) noexcept - { - z_vel_pert(i, j, k) = WFromOmega(i, j, k, 0.0, x_vel_pert, y_vel_pert, z_nd, dxInv); - }); - - amrex::Gpu::streamSynchronize(); -} - -void -Problem::init_custom_terrain ( - const Geometry& geom, - MultiFab& z_phys_nd, - const Real& time) -{ - - // Check if a valid text file exists for the terrain - std::string fname; - ParmParse pp("erf"); - auto valid_fname = pp.query("terrain_file_name",fname); - if (valid_fname) { - this->read_custom_terrain(fname,geom,z_phys_nd,time); - } else { - // Domain cell size and real bounds - auto dx = geom.CellSizeArray(); - auto ProbLoArr = geom.ProbLoArray(); - auto ProbHiArr = geom.ProbHiArray(); - - // Domain valid box (z_nd is nodal) - const amrex::Box& domain = geom.Domain(); - int domlo_x = domain.smallEnd(0); int domhi_x = domain.bigEnd(0) + 1; - // int domlo_y = domain.smallEnd(1); int domhi_y = domain.bigEnd(1) + 1; - int domlo_z = domain.smallEnd(2); - - // User function parameters - Real a = 0.5; - Real num = 8 * a * a * a; - Real xcen = 0.5 * (ProbLoArr[0] + ProbHiArr[0]); - // Real ycen = 0.5 * (ProbLoArr[1] + ProbHiArr[1]); - - // if hm is nonzero, then use alternate hill definition - Real hm = parms.hmax; - Real L = parms.L; - - // Number of ghost cells - int ngrow = z_phys_nd.nGrow(); - - // Populate bottom plane - int k0 = domlo_z; - - for ( amrex::MFIter mfi(z_phys_nd,amrex::TilingIfNotGPU()); mfi.isValid(); ++mfi ) - { - amrex::Box zbx = mfi.nodaltilebox(2); - if (zbx.smallEnd(2) > k0) continue; - - // Grown box with no z range - amrex::Box xybx = mfi.growntilebox(ngrow); - xybx.setRange(2,0); - - amrex::Array4 const& z_arr = z_phys_nd.array(mfi); - - ParallelFor(xybx, [=] AMREX_GPU_DEVICE (int i, int j, int) - { - // Clip indices for ghost-cells - int ii = amrex::min(amrex::max(i,domlo_x),domhi_x); - // int jj = amrex::min(amrex::max(j,domlo_y),domhi_y); - - // Location of nodes - Real x = (ProbLoArr[0] + ii * dx[0] - xcen); - // Real y = (jj * dx[1] - ycen); - - // WoA Hill in x-direction - if (hm==0) { - z_arr(i,j,k0) = num / (x*x + 4 * a * a); - } else { - Real x_L = x / L; - z_arr(i,j,k0) = hm / (1 + x_L*x_L); - } - }); - } - } -} diff --git a/Exec/DryRegTests/WitchOfAgnesi_JAMES/GNUmakefile b/Exec/DryRegTests/WitchOfAgnesi_JAMES/GNUmakefile deleted file mode 100644 index eb058c96c..000000000 --- a/Exec/DryRegTests/WitchOfAgnesi_JAMES/GNUmakefile +++ /dev/null @@ -1,33 +0,0 @@ -# AMReX -COMP = gnu -PRECISION = DOUBLE - -# Profiling -PROFILE = FALSE -TINY_PROFILE = FALSE -COMM_PROFILE = FALSE -TRACE_PROFILE = FALSE -MEM_PROFILE = FALSE -USE_GPROF = FALSE - -# Performance -USE_MPI = TRUE -USE_OMP = FALSE - -USE_CUDA = FALSE -USE_HIP = FALSE -USE_SYCL = FALSE - -# Debugging -DEBUG = FALSE - -TEST = TRUE -USE_ASSERTION = TRUE - -# GNU Make -Bpack := ./Make.package -Blocs := . - -ERF_HOME := ../../.. -ERF_PROBLEM_DIR = $(ERF_HOME)/Exec/DryRegTests/WitchOfAgnesi_JAMES -include $(ERF_HOME)/Exec/Make.ERF diff --git a/Exec/DryRegTests/WitchOfAgnesi_JAMES/Make.package b/Exec/DryRegTests/WitchOfAgnesi_JAMES/Make.package deleted file mode 100644 index 5fc21f61c..000000000 --- a/Exec/DryRegTests/WitchOfAgnesi_JAMES/Make.package +++ /dev/null @@ -1,2 +0,0 @@ -CEXE_headers += ERF_prob.H -CEXE_sources += ERF_prob.cpp diff --git a/Exec/DryRegTests/WitchOfAgnesi_JAMES/README b/Exec/DryRegTests/WitchOfAgnesi_JAMES/README deleted file mode 100644 index cacb58b78..000000000 --- a/Exec/DryRegTests/WitchOfAgnesi_JAMES/README +++ /dev/null @@ -1,6 +0,0 @@ -This problem setup is for flow over an idealized hill with a "Witch of Agnesi" profile. -The domain is periodic in the y-direction, with inflow at low x and outflow at high x. -The terrain-fitted coordinates follow the contour of the hill. - -This problem is primarily designed to test the implementation of the terrain-fitted coordinates. - diff --git a/Exec/DryRegTests/WitchOfAgnesi_JAMES/input_sounding b/Exec/DryRegTests/WitchOfAgnesi_JAMES/input_sounding deleted file mode 100644 index d91f8160c..000000000 --- a/Exec/DryRegTests/WitchOfAgnesi_JAMES/input_sounding +++ /dev/null @@ -1,202 +0,0 @@ -1000 300 0 -0 300 0 10 0 -0.1 300.000305810553 0 10 0 -0.160723065020908 300.000491508247 0 10 0 -0.224482283292861 300.000686490948 0 10 0 -0.291429462478412 300.000891222922 0 10 0 -0.361724000623241 300.001106191644 0 10 0 -0.435533265675311 300.001331908968 0 10 0 -0.513032993979984 300.001568912341 0 10 0 -0.594407708699891 300.001817766084 0 10 0 -0.679851159155793 300.002079062737 0 10 0 -0.769566782134491 300.002353424467 0 10 0 -0.863768186262123 300.002641504554 0 10 0 -0.962679660596138 300.002943988942 0 10 0 -1.06653670864685 300.003261597879 0 10 0 -1.1755866091001 300.003595087624 0 10 0 -1.29008900457602 300.003945252255 0 10 0 -1.41031651982572 300.004312925558 0 10 0 -1.53655541083792 300.004698983011 0 10 0 -1.66910624640072 300.005104343871 0 10 0 -1.80828462374167 300.005529973364 0 10 0 -1.95442191994966 300.005976884981 0 10 0 -2.10786608096805 300.006446142896 0 10 0 -2.26898245003736 300.006938864496 0 10 0 -2.43815463756014 300.007456223047 0 10 0 -2.61578543445905 300.007999450486 0 10 0 -2.80229777120291 300.008569840356 0 10 0 -2.99813572478396 300.009168750886 0 10 0 -3.20376557604407 300.00979760823 0 10 0 -3.41967691986718 300.010457909859 0 10 0 -3.64638383088145 300.011151228134 0 10 0 -3.88442608744643 300.011879214047 0 10 0 -4.13437045683966 300.012643601157 0 10 0 -4.39681204470255 300.013446209719 0 10 0 -4.67237571195859 300.014288951019 0 10 0 -4.96171756257742 300.015173831933 0 10 0 -5.2655265057272 300.016102959701 0 10 0 -5.58452589603447 300.017078546954 0 10 0 -5.9194752558571 300.018102916984 0 10 0 -6.27117208367086 300.01917850928 0 10 0 -6.64045375287532 300.02030788534 0 10 0 -7.02819950553999 300.02149373478 0 10 0 -7.4353325458379 300.022738881736 0 10 0 -7.8628222381507 300.024046291601 0 10 0 -8.31168641507915 300.025419078091 0 10 0 -8.78299380085401 300.026860510666 0 10 0 -9.27786655591762 300.028374022323 0 10 0 -9.79748294873441 300.02996321778 0 10 0 -10.343080161192 300.03163188207 0 10 0 -10.9159572342726 300.033383989562 0 10 0 -11.5174781610071 300.03522371344 0 10 0 -12.1490751340783 300.037155435654 0 10 0 -12.8122519558032 300.039183757364 0 10 0 -13.5085876186142 300.041313509916 0 10 0 -14.2397400645659 300.043549766366 0 10 0 -15.0074501328151 300.045897853577 0 10 0 -15.8135457044767 300.048363364926 0 10 0 -16.6599460547215 300.050952173646 0 10 0 -17.5486664224785 300.053670446841 0 10 0 -18.4818228086233 300.056524660199 0 10 0 -19.4616370140754 300.059521613446 0 10 0 -20.4904419298 300.062668446572 0 10 0 -21.5706870913109 300.065972656871 0 10 0 -22.7049445108974 300.069442116846 0 10 0 -23.8959148014632 300.073085092993 0 10 0 -25.1464336065572 300.076910265546 0 10 0 -26.459478351906 300.080926749207 0 10 0 -27.8381753345222 300.08514411491 0 10 0 -29.2858071662692 300.089572412689 0 10 0 -30.8058205896036 300.094222195688 0 10 0 -32.4018346841047 300.099104545376 0 10 0 -34.0776494833309 300.104231098039 0 10 0 -35.8372550225183 300.109614072588 0 10 0 -37.6848408386651 300.115266299782 0 10 0 -39.6248059456193 300.121201252906 0 10 0 -41.6617693079212 300.127433080003 0 10 0 -43.8005808383381 300.133976637721 0 10 0 -46.046332945276 300.14084752687 0 10 0 -48.4043726575607 300.148062129764 0 10 0 -50.8803143554596 300.155637649446 0 10 0 -53.4800531382535 300.163592150892 0 10 0 -56.2097788601871 300.171944604288 0 10 0 -59.0759908682173 300.180714930494 0 10 0 -62.0855134766491 300.189924048799 0 10 0 -65.2455122155025 300.199593927083 0 10 0 -68.5635108912985 300.209747634525 0 10 0 -72.0474095008844 300.220409396956 0 10 0 -75.7055030409495 300.231604655027 0 10 0 -79.5465012580179 300.243360125306 0 10 0 -83.5795493859397 300.255703864478 0 10 0 -87.8142499202576 300.268665336786 0 10 0 -92.2606854812914 300.282275484895 0 10 0 -96.9294428203768 300.29656680435 0 10 0 -101.831638026417 300.311573421807 0 10 0 -106.978942992758 300.32733117724 0 10 0 -112.383613207417 300.343877710322 0 10 0 -118.058516932809 300.361252551202 0 10 0 -124.01716584447 300.3794972159 0 10 0 -130.273747201715 300.39865530656 0 10 0 -136.843157626821 300.418772616821 0 10 0 -143.741038573183 300.439897242553 0 10 0 -150.983813566863 300.462079698262 0 10 0 -158.588727310228 300.485373039445 0 10 0 -166.57388674076 300.509832991201 0 10 0 -174.958304142819 300.535518083443 0 10 0 -183.761942414981 300.562489793045 0 10 0 -193.005762600751 300.590812693291 0 10 0 -202.711773795809 300.620554611012 0 10 0 -212.90308555062 300.651786791824 0 10 0 -223.603962893172 300.684584073882 0 10 0 -234.839884102852 300.719025070621 0 10 0 -246.637601373015 300.755192362945 0 10 0 -259.025204506687 300.793172701387 0 10 0 -272.032187797042 300.833057218757 0 10 0 -285.689520251915 300.874941653865 0 10 0 -300.029719329532 300.918926586887 0 10 0 -315.086928361029 300.965117687037 0 10 0 -330.896997844102 301.013625973195 0 10 0 -347.497570801328 301.064568088193 0 10 0 -364.928172406415 301.118066587535 0 10 0 -383.230304091757 301.174250243313 0 10 0 -402.447542361366 301.233254364182 0 10 0 -422.625642544455 301.29522113227 0 10 0 -443.812647736698 301.360299957982 0 10 0 -466.059003188554 301.428647853691 0 10 0 -489.417676413003 301.500429827374 0 10 0 -513.944283298674 301.575819297339 0 10 0 -539.697220528629 301.654998529233 0 10 0 -566.737804620081 301.738159096591 0 10 0 -595.130417916106 301.825502366315 0 10 0 -624.942661876932 301.917240010488 0 10 0 -656.2455180358 302.013594546083 0 10 0 -689.113517002611 302.114799904181 0 10 0 -723.624915917762 302.221102030456 0 10 0 -759.861884778671 302.332759518767 0 10 0 -797.910702082626 302.450044279837 0 10 0 -837.861960251778 302.573242247137 0 10 0 -879.810781329388 302.702654122226 0 10 0 -923.857043460878 302.838596161948 0 10 0 -970.105618698943 302.981401010067 0 10 0 -1018.66662269891 303.131418576098 0 10 0 -1069.65567689888 303.289016964272 0 10 0 -1123.19418380884 303.454583455798 0 10 0 -1179.40961606431 303.628525547815 0 10 0 -1238.43581993254 303.811272052652 0 10 0 -1300.41333399419 304.003274261307 0 10 0 -1365.48972375892 304.20500717532 0 10 0 -1433.81993301189 304.416970811561 0 10 0 -1505.5666527275 304.639691584752 0 10 0 -1580.9007084289 304.873723772962 0 10 0 -1660.00146691536 305.119651071676 0 10 0 -1743.05726332615 305.378088242506 0 10 0 -1830.26584955748 305.649682863082 0 10 0 -1921.83486510038 305.935117185178 0 10 0 -2017.98233142042 306.235110108722 0 10 0 -2118.93717105646 306.550419279929 0 10 0 -2224.9397526743 306.881843322521 0 10 0 -2336.24246337304 307.230224211701 0 10 0 -2453.11030960671 307.59644980141 0 10 0 -2575.82154815207 307.981456516271 0 10 0 -2704.66834862469 308.386232220612 0 10 0 -2839.95748912095 308.811819278049 0 10 0 -2982.01108664202 309.259317816308 0 10 0 -3131.16736403914 309.729889213266 0 10 0 -3287.78145530612 310.224759821641 0 10 0 -3452.22625113645 310.745224951361 0 10 0 -3624.89328675829 311.292653130385 0 10 0 -3806.19367416122 311.868490666714 0 10 0 -3996.55908093431 312.47426653646 0 10 0 -4196.44275804604 313.111597625229 0 10 0 -4406.32061901337 313.782194352696 0 10 0 -4626.69237302906 314.487866713194 0 10 0 -4858.08271474553 315.230530768355 0 10 0 -5101.04257354783 316.012215631462 0 10 0 -5356.15042529024 316.835070987167 0 10 0 -5624.01366961977 317.701375194693 0 10 0 -5905.27007616578 318.613544027622 0 10 0 -6200.58930303909 319.574140108901 0 10 0 -6510.67449125607 320.585883105897 0 10 0 -6836.26393888389 321.651660757288 0 10 0 -7178.13285889311 322.774540811279 0 10 0 -7537.09522490278 323.957783963396 0 10 0 -7914.00570921294 325.204857891787 0 10 0 -8309.76171773861 326.519452498994 0 10 0 -8725.30552669056 327.905496481415 0 10 0 -9161.62652609011 329.367175361605 0 10 0 -9619.76357545964 330.908951134176 0 10 0 -10100.8074772976 332.535583693757 0 10 0 -10605.9035742275 334.25215423341 0 10 0 -11136.2544760039 336.064090824536 0 10 0 -11693.1229228692 337.977196414921 0 10 0 -12277.8347920776 339.997679510655 0 10 0 -12891.7822547466 342.132187840735 0 10 0 -13536.4270905489 344.387845340804 0 10 0 -14213.3041681414 346.772292835399 0 10 0 -14924.0250996135 349.29373284709 0 10 0 -15670.2820776592 351.960979016934 0 10 0 -16453.8519046071 354.783510684875 0 10 0 -17276.6002229025 357.77153325238 0 10 0 -18140.4859571127 360.936045034252 0 10 0 -19047.5659780333 364.288911404021 0 10 0 -20000 367.84294714969 0 10 0 diff --git a/Exec/DryRegTests/WitchOfAgnesi_JAMES/inputs b/Exec/DryRegTests/WitchOfAgnesi_JAMES/inputs deleted file mode 100644 index c6bb252f3..000000000 --- a/Exec/DryRegTests/WitchOfAgnesi_JAMES/inputs +++ /dev/null @@ -1,76 +0,0 @@ -# ------------------ INPUTS TO MAIN PROGRAM ------------------- -max_step = 3000000 - -amrex.fpe_trap_invalid = 0 - -fabarray.mfiter_tile_size = 1024 1024 1024 - -# PROBLEM SIZE & GEOMETRY -geometry.prob_lo = -72000. 0. 0. -geometry.prob_hi = 72000. 1. 20000. # zhi not used with grid stretching -amr.n_cell = 288 1 200 - -geometry.is_periodic = 0 1 0 - -#erf.initial_dz = 10 -#erf.grid_stretching_ratio = 1.03 - -erf.terrain_z_levels = 0.000000 0.100000 0.160723 0.224482 0.291429 0.361724 0.435533 0.513033 0.594408 0.679851 0.769567 0.863768 0.962680 1.066537 1.175587 1.290089 1.410317 1.536555 1.669106 1.808285 1.954422 2.107866 2.268982 2.438155 2.615785 2.802298 2.998136 3.203766 3.419677 3.646384 3.884426 4.134370 4.396812 4.672376 4.961718 5.265527 5.584526 5.919475 6.271172 6.640454 7.028200 7.435333 7.862822 8.311686 8.782994 9.277867 9.797483 10.343080 10.915957 11.517478 12.149075 12.812252 13.508588 14.239740 15.007450 15.813546 16.659946 17.548666 18.481823 19.461637 20.490442 21.570687 22.704945 23.895915 25.146434 26.459478 27.838175 29.285807 30.805821 32.401835 34.077649 35.837255 37.684841 39.624806 41.661769 43.800581 46.046333 48.404373 50.880314 53.480053 56.209779 59.075991 62.085513 65.245512 68.563511 72.047410 75.705503 79.546501 83.579549 87.814250 92.260685 96.929443 101.831638 106.978943 112.383613 118.058517 124.017166 130.273747 136.843158 143.741039 150.983814 158.588727 166.573887 174.958304 183.761942 193.005763 202.711774 212.903086 223.603963 234.839884 246.637601 259.025205 272.032188 285.689520 300.029719 315.086928 330.896998 347.497571 364.928172 383.230304 402.447542 422.625643 443.812648 466.059003 489.417676 513.944283 539.697221 566.737805 595.130418 624.942662 656.245518 689.113517 723.624916 759.861885 797.910702 837.861960 879.810781 923.857043 970.105619 1018.666623 1069.655677 1123.194184 1179.409616 1238.435820 1300.413334 1365.489724 1433.819933 1505.566653 1580.900708 1660.001467 1743.057263 1830.265850 1921.834865 2017.982331 2118.937171 2224.939753 2336.242463 2453.110310 2575.821548 2704.668349 2839.957489 2982.011087 3131.167364 3287.781455 3452.226251 3624.893287 3806.193674 3996.559081 4196.442758 4406.320619 4626.692373 4858.082715 5101.042574 5356.150425 5624.013670 5905.270076 6200.589303 6510.674491 6836.263939 7178.132859 7537.095225 7914.005709 8309.761718 8725.305527 9161.626526 9619.763575 10100.807477 10605.903574 11136.254476 11693.122923 12277.834792 12891.782255 13536.427091 14213.304168 14924.025100 15670.282078 16453.851905 17276.600223 18140.485957 19047.565978 20000.000000 - -xlo.type = "Inflow" -xhi.type = "Outflow" -xlo.velocity = 10. 0. 0. -#xlo.density = 1.0 -#xlo.theta = 300. -#xlo.scalar = 0. - -zlo.type = "SlipWall" -zhi.type = "SlipWall" -#zhi.theta_grad = 0.003 - -# TIME STEP CONTROL -#erf.substepping_type = None -erf.fixed_mri_dt_ratio = 4 -erf.fixed_dt = 0.03 - -# DIAGNOSTICS & VERBOSITY -erf.sum_interval = 1 # timesteps between computing mass -erf.v = 1 # verbosity in ERF.cpp -amr.v = 1 # verbosity in Amr.cpp - -# REFINEMENT / REGRIDDING -amr.max_level = 0 # maximum level number allowed - -# CHECKPOINT FILES -erf.check_file = chk # root name of checkpoint file -erf.check_int = 1000 # number of timesteps between checkpoints - -# PLOTFILES -erf.plot_file_1 = plt # prefix of plotfile name -erf.plot_int_1 = 5000 # number of timesteps between plotfiles -erf.plot_vars_1 = density x_velocity y_velocity z_velocity pressure theta pert_pres pert_dens - -# SOLVER CHOICE -erf.use_gravity = true -erf.use_coriolis = false -erf.les_type = "None" - -erf.molec_diff_type = "None" -#erf.dynamicViscosity = 1e-5 # [kg/(m-s)] - -erf.rayleigh_damp_W = true -erf.rayleigh_zdamp = 5000.0 -erf.rayleigh_dampcoef = 0.2 - -erf.init_type = "input_sounding" -erf.init_sounding_ideal = true - -# TERRRAIN GRID TYPE -erf.terrain_type = Static -#erf.terrain_smoothing = 1 # Smoothed Terrain Following coords (Klemp 2011) -#erf.terrain_gamma_m = 0.5 -erf.terrain_smoothing = 2 # Sullivan TF - -# PROBLEM PARAMETERS -prob.hmax = 1.0 # full hill height -prob.L = 1000.0 # hill length at half-height diff --git a/Source/ERF.H b/Source/ERF.H index 07055ed5a..0aa02f4ab 100644 --- a/Source/ERF.H +++ b/Source/ERF.H @@ -177,7 +177,6 @@ public: amrex::MultiFab& p); #ifdef ERF_USE_FFT - amrex::Array,AMREX_SPACEDIM> get_fft_bc () const noexcept; void solve_with_fft (int lev, amrex::MultiFab& rhs, amrex::MultiFab& p, amrex::Array& fluxes); #endif @@ -187,7 +186,7 @@ public: #endif void solve_with_gmres (int lev, amrex::Vector& rhs, amrex::Vector& p, - amrex::Array& fluxes); + amrex::Vector>& fluxes); void solve_with_mlmg (int lev, amrex::Vector& rhs, amrex::Vector& p, amrex::Vector>& fluxes); @@ -1378,8 +1377,8 @@ private: #endif #ifdef ERF_USE_FFT - std::unique_ptr> m_3D_poisson; - std::unique_ptr> m_2D_poisson; + amrex::Vector>> m_3D_poisson; + amrex::Vector>> m_2D_poisson; #endif public: diff --git a/Source/LinearSolvers/ERF_FFT_TerrainPrecond.H b/Source/LinearSolvers/ERF_FFT_TerrainPrecond.H deleted file mode 100644 index 941fe3f29..000000000 --- a/Source/LinearSolvers/ERF_FFT_TerrainPrecond.H +++ /dev/null @@ -1,262 +0,0 @@ -#ifndef ERF_FFT_TERRAIN_PRECOND_H_ -#define ERF_FFT_TERRAIN_PRECOND_H_ - -#include -#include -#include - -namespace amrex::FFT -{ - -/** - * \brief 3D Preconditioner for terrain problems with periodic boundaries in the first two - * dimensions and Neumann in the last dimension. - */ -template -class PoissonTerrainPrecond -{ -public: - using T = typename MF::value_type; - - template ,int> = 0> - explicit PoissonTerrainPrecond (Geometry const& geom) - : m_geom(geom), m_r2c(geom.Domain(), Info().setBatchMode(true)) - { - AMREX_ALWAYS_ASSERT(geom.isPeriodic(0) && geom.isPeriodic(1)); - } - - void solve (MF& soln, MF const& rhs, MF const& height); - - template - void solve_doit (MF& soln, MF const& rhs, MF const& height, DZ const& dz); // has to be public for cuda - -private: - Geometry m_geom; - R2C m_r2c; -}; - -template -void PoissonTerrainPrecond::solve (MF& soln, MF const& rhs, MF const& height) -{ - auto delz = T(m_geom.CellSize(AMREX_SPACEDIM-1)); - solve_doit(soln, rhs, height, fft_poisson_detail::DZ{delz}); -} - -template -template -void PoissonTerrainPrecond::solve_doit (MF& soln, MF const& rhs, MF const& height, DZ const& dz) -{ - BL_PROFILE("FFT::PoissonTerrainPrecond::solve"); - -#if (AMREX_SPACEDIM < 3) - amrex::ignore_unused(soln, rhs, dz); -#else - auto facx = T(2)*Math::pi()/T(m_geom.ProbLength(0)); - auto facy = T(2)*Math::pi()/T(m_geom.ProbLength(1)); - - auto dx =T(m_geom.CellSize(0)); - auto dy = T(m_geom.CellSize(1)); - - auto dxinv = T(m_geom.InvCellSize(0)); - auto dyinv = T(m_geom.InvCellSize(1)); - - auto scale = T(1.0)/(T(m_geom.Domain().length(0)) * - T(m_geom.Domain().length(1))); - auto ny = m_geom.Domain().length(1); - auto nz = m_geom.Domain().length(2); - - Box cdomain = m_geom.Domain(); - cdomain.setBig(0,cdomain.length(0)/2); - auto cba = amrex::decompose(cdomain, ParallelContext::NProcsSub(), - {AMREX_D_DECL(true,true,false)}); - DistributionMapping dm = detail::make_iota_distromap(cba.size()); - FabArray > > spmf(cba, dm, 1, 0); - - m_r2c.forward(rhs, spmf); - - for (MFIter mfi(spmf); mfi.isValid(); ++mfi) - { - auto const& spectral = spmf.array(mfi); - auto const& box = mfi.validbox(); - auto const& xybox = amrex::makeSlab(box, 2, 0); - - auto const zp = height.const_array(mfi); - -#ifdef AMREX_USE_GPU - // xxxxx TODO: We need to explore how to optimize this - // function. Maybe we can use cusparse. Maybe we should make - // z-direction to be the unit stride direction. - - FArrayBox tridiag_workspace(box,4); - auto const& ald = tridiag_workspace.array(0); - auto const& bd = tridiag_workspace.array(1); - auto const& cud = tridiag_workspace.array(2); - auto const& scratch = tridiag_workspace.array(3); - - amrex::ParallelFor(xybox, [=] AMREX_GPU_DEVICE (int i, int j, int) - { - T a = facx*i; - T b = (j < ny/2) ? facy*j : facy*(ny-j); - - T k2 = T(2)*(std::cos(a*dx)-T(1))/(dx*dx) - + T(2)*(std::cos(b*dy)-T(1))/(dy*dy); - - // Tridiagonal solve with homogeneous Neumann - for(int k=0; k < nz; k++) { - Real hzeta_inv_on_cc = 4.0 / ( (zp(i,j,k+1) + zp(i+1,j,k+1) + zp(i,j+1,k+1) + zp(i+1,j+1,k+1)) - -(zp(i,j,k ) + zp(i+1,j,k ) + zp(i,j+1,k ) + zp(i+1,j+1,k )) ); - if(k==0) { - - Real hzeta_inv_on_zhi = 8.0 / ( (zp(i,j,k+2) + zp(i+1,j,k+2) + zp(i,j+1,k+2) + zp(i+1,j+1,k+2)) - -(zp(i,j,k ) + zp(i+1,j,k ) + zp(i,j+1,k ) + zp(i+1,j+1,k )) ); - Real h_xi_on_zhi = 0.5 * (zp(i+1,j+1,k+1) + zp(i+1,j,k+1) - zp(i,j+1,k+1) - zp(i,j,k+1)) * dxinv; - Real h_eta_on_zhi = 0.5 * (zp(i+1,j+1,k+1) + zp(i,j+1,k+1) - zp(i+1,j,k+1) - zp(i,j,k+1)) * dyinv; - - ald(i,j,k) = 0.; - cud(i,j,k) = hzeta_inv_on_cc * (1.0 + h_xi_on_zhi*h_xi_on_zhi + h_eta_on_zhi*h_eta_on_zhi) * hzeta_inv_on_zhi; - bd(i,j,k) = k2 - ald(i,j,k) - cud(i,j,k); - - } else if (k == nz-1) { - - Real hzeta_inv_on_zlo = 8.0 / ( (zp(i,j,k+1) + zp(i+1,j,k+1) + zp(i,j+1,k+1) + zp(i+1,j+1,k+1)) - -(zp(i,j,k-1) + zp(i+1,j,k-1) + zp(i,j+1,k-1) + zp(i+1,j+1,k-1)) ); - Real h_xi_on_zlo = 0.5 * (zp(i+1,j+1,k ) + zp(i+1,j,k ) - zp(i,j+1,k ) - zp(i,j,k )) * dxinv; - Real h_eta_on_zlo = 0.5 * (zp(i+1,j+1,k ) + zp(i,j+1,k ) - zp(i+1,j,k ) - zp(i,j,k )) * dyinv; - ald(i,j,k) = hzeta_inv_on_cc * (1.0 + h_xi_on_zlo*h_xi_on_zlo + h_eta_on_zlo*h_eta_on_zlo) * hzeta_inv_on_zlo; - cud(i,j,k) = 0.; - bd(i,j,k) = k2 - ald(i,j,k) - cud(i,j,k); - if (i == 0 && j == 0) { - bd(i,j,k) *= 2.0; - } - } else { - Real hzeta_inv_on_zlo = 8.0 / ( (zp(i,j,k+1) + zp(i+1,j,k+1) + zp(i,j+1,k+1) + zp(i+1,j+1,k+1)) - -(zp(i,j,k-1) + zp(i+1,j,k-1) + zp(i,j+1,k-1) + zp(i+1,j+1,k-1)) ); - Real h_xi_on_zlo = 0.5 * (zp(i+1,j+1,k ) + zp(i+1,j,k ) - zp(i,j+1,k ) - zp(i,j,k )) * dxinv; - Real h_eta_on_zlo = 0.5 * (zp(i+1,j+1,k ) + zp(i,j+1,k ) - zp(i+1,j,k ) - zp(i,j,k )) * dyinv; - - Real hzeta_inv_on_zhi = 8.0 / ( (zp(i,j,k+2) + zp(i+1,j,k+2) + zp(i,j+1,k+2) + zp(i+1,j+1,k+2)) - -(zp(i,j,k ) + zp(i+1,j,k ) + zp(i,j+1,k ) + zp(i+1,j+1,k )) ); - Real h_xi_on_zhi = 0.5 * (zp(i+1,j+1,k+1) + zp(i+1,j,k+1) - zp(i,j+1,k+1) - zp(i,j,k+1)) * dxinv; - Real h_eta_on_zhi = 0.5 * (zp(i+1,j+1,k+1) + zp(i,j+1,k+1) - zp(i+1,j,k+1) - zp(i,j,k+1)) * dyinv; - - ald(i,j,k) = hzeta_inv_on_cc * (1.0 + h_xi_on_zlo*h_xi_on_zlo + h_eta_on_zlo*h_eta_on_zlo) * hzeta_inv_on_zlo; - cud(i,j,k) = hzeta_inv_on_cc * (1.0 + h_xi_on_zhi*h_xi_on_zhi + h_eta_on_zhi*h_eta_on_zhi) * hzeta_inv_on_zhi; - bd(i,j,k) = k2 - ald(i,j,k) - cud(i,j,k); - - } - } - - scratch(i,j,0) = cud(i,j,0)/bd(i,j,0); - spectral(i,j,0) = spectral(i,j,0)/bd(i,j,0); - - for (int k = 1; k < nz; k++) { - if (k < nz-1) { - scratch(i,j,k) = cud(i,j,k) / (bd(i,j,k) - ald(i,j,k) * scratch(i,j,k-1)); - } - spectral(i,j,k) = (spectral(i,j,k) - ald(i,j,k) * spectral(i,j,k - 1)) - / (bd(i,j,k) - ald(i,j,k) * scratch(i,j,k-1)); - } - - for (int k = nz - 2; k >= 0; k--) { - spectral(i,j,k) -= scratch(i,j,k) * spectral(i,j,k + 1); - } - - for (int k = 0; k < nz; ++k) { - spectral(i,j,k) *= scale; - } - }); - Gpu::streamSynchronize(); - -#else - - Gpu::DeviceVector> ald(nz); - Gpu::DeviceVector> bd(nz); - Gpu::DeviceVector> cud(nz); - Gpu::DeviceVector> scratch(nz); - - amrex::LoopOnCpu(xybox, [&] (int i, int j, int) - { - T a = facx*i; - T b = (j < ny/2) ? facy*j : facy*(ny-j); - - T k2 = T(2)*(std::cos(a*dx)-T(1))/(dx*dx) - + T(2)*(std::cos(b*dy)-T(1))/(dy*dy); - - // Tridiagonal solve with homogeneous Neumann - for(int k=0; k < nz; k++) { - - Real hzeta_inv_on_cc = 4.0 / ( (zp(i,j,k+1) + zp(i+1,j,k+1) + zp(i,j+1,k+1) + zp(i+1,j+1,k+1)) - -(zp(i,j,k ) + zp(i+1,j,k ) + zp(i,j+1,k ) + zp(i+1,j+1,k )) ); - - if(k==0) { - - Real hzeta_inv_on_zhi = 8.0 / ( (zp(i,j,k+2) + zp(i+1,j,k+2) + zp(i,j+1,k+2) + zp(i+1,j+1,k+2)) - -(zp(i,j,k ) + zp(i+1,j,k ) + zp(i,j+1,k ) + zp(i+1,j+1,k )) ); - Real h_xi_on_zhi = 0.5 * (zp(i+1,j+1,k+1) + zp(i+1,j,k+1) - zp(i,j+1,k+1) - zp(i,j,k+1)) * dxinv; - Real h_eta_on_zhi = 0.5 * (zp(i+1,j+1,k+1) + zp(i,j+1,k+1) - zp(i+1,j,k+1) - zp(i,j,k+1)) * dyinv; - - ald[k] = 0.; - cud[k] = hzeta_inv_on_cc * (1.0 + h_xi_on_zhi*h_xi_on_zhi + h_eta_on_zhi*h_eta_on_zhi) * hzeta_inv_on_zhi; - bd[k] = k2 -ald[k]-cud[k]; - - } else if (k == nz-1) { - - Real hzeta_inv_on_zlo = 8.0 / ( (zp(i,j,k+1) + zp(i+1,j,k+1) + zp(i,j+1,k+1) + zp(i+1,j+1,k+1)) - -(zp(i,j,k-1) + zp(i+1,j,k-1) + zp(i,j+1,k-1) + zp(i+1,j+1,k-1)) ); - Real h_xi_on_zlo = 0.5 * (zp(i+1,j+1,k ) + zp(i+1,j,k ) - zp(i,j+1,k ) - zp(i,j,k )) * dxinv; - Real h_eta_on_zlo = 0.5 * (zp(i+1,j+1,k ) + zp(i,j+1,k ) - zp(i+1,j,k ) - zp(i,j,k )) * dyinv; - - ald[k] = hzeta_inv_on_cc * (1.0 + h_xi_on_zlo*h_xi_on_zlo + h_eta_on_zlo*h_eta_on_zlo) * hzeta_inv_on_zlo; - cud[k] = 0.; - bd[k] = k2 -ald[k]-cud[k]; - - if (i == 0 && j == 0) { - bd[k] *= 2.0; - } - } else { - - Real hzeta_inv_on_zlo = 8.0 / ( (zp(i,j,k+1) + zp(i+1,j,k+1) + zp(i,j+1,k+1) + zp(i+1,j+1,k+1)) - -(zp(i,j,k-1) + zp(i+1,j,k-1) + zp(i,j+1,k-1) + zp(i+1,j+1,k-1)) ); - Real h_xi_on_zlo = 0.5 * (zp(i+1,j+1,k ) + zp(i+1,j,k ) - zp(i,j+1,k ) - zp(i,j,k )) * dxinv; - Real h_eta_on_zlo = 0.5 * (zp(i+1,j+1,k ) + zp(i,j+1,k ) - zp(i+1,j,k ) - zp(i,j,k )) * dyinv; - - Real hzeta_inv_on_zhi = 8.0 / ( (zp(i,j,k+2) + zp(i+1,j,k+2) + zp(i,j+1,k+2) + zp(i+1,j+1,k+2)) - -(zp(i,j,k ) + zp(i+1,j,k ) + zp(i,j+1,k ) + zp(i+1,j+1,k )) ); - Real h_xi_on_zhi = 0.5 * (zp(i+1,j+1,k+1) + zp(i+1,j,k+1) - zp(i,j+1,k+1) - zp(i,j,k+1)) * dxinv; - Real h_eta_on_zhi = 0.5 * (zp(i+1,j+1,k+1) + zp(i,j+1,k+1) - zp(i+1,j,k+1) - zp(i,j,k+1)) * dyinv; - - ald[k] = hzeta_inv_on_cc * (1.0 + h_xi_on_zlo*h_xi_on_zlo + h_eta_on_zlo*h_eta_on_zlo) * hzeta_inv_on_zlo; - cud[k] = hzeta_inv_on_cc * (1.0 + h_xi_on_zhi*h_xi_on_zhi + h_eta_on_zhi*h_eta_on_zhi) * hzeta_inv_on_zhi; - bd[k] = k2 - ald[k] - cud[k]; - } - } - - scratch[0] = cud[0]/bd[0]; - spectral(i,j,0) = spectral(i,j,0)/bd[0]; - - for (int k = 1; k < nz; k++) { - if (k < nz-1) { - scratch[k] = cud[k] / (bd[k] - ald[k] * scratch[k-1]); - } - spectral(i,j,k) = (spectral(i,j,k) - ald[k] * spectral(i,j,k - 1)) - / (bd[k] - ald[k] * scratch[k-1]); - } - - for (int k = nz - 2; k >= 0; k--) { - spectral(i,j,k) -= scratch[k] * spectral(i,j,k + 1); - } - - for (int k = 0; k < nz; ++k) { - spectral(i,j,k) *= scale; - } - }); -#endif - } - - m_r2c.backward(spmf, soln); -#endif -} - -} - -#endif diff --git a/Source/LinearSolvers/ERF_FFT_Utils.H b/Source/LinearSolvers/ERF_FFT_Utils.H new file mode 100644 index 000000000..c5ae0556d --- /dev/null +++ b/Source/LinearSolvers/ERF_FFT_Utils.H @@ -0,0 +1,73 @@ +#ifndef ERF_FFT_UTILS_H_ +#define ERF_FFT_UTILS_H_ + +#ifdef ERF_USE_FFT + +using namespace amrex; + +inline Array,AMREX_SPACEDIM> +get_fft_bc (Geometry const& lev_geom, + Array l_domain_bc_type, + Box const& bounding_box) noexcept +{ + Array,AMREX_SPACEDIM> r; + + for (int dir = 0; dir <= 1; dir++) + { + auto bc_type_lo = l_domain_bc_type[Orientation(dir,Orientation::low)]; + auto bc_type_hi = l_domain_bc_type[Orientation(dir,Orientation::high)]; + + if ( lev_geom.isPeriodic(dir) && + (lev_geom.Domain().smallEnd(dir) == bounding_box.smallEnd(dir)) && + (lev_geom.Domain().bigEnd(dir) == bounding_box.bigEnd(dir)) ) { + r[dir] = std::make_pair(FFT::Boundary::periodic,FFT::Boundary::periodic); + amrex::Print() << "SETTING " << dir << " TO PERIODIC " << std::endl; + } + + else if ( (lev_geom.Domain().smallEnd(dir) == bounding_box.smallEnd(dir)) && + (lev_geom.Domain().bigEnd(dir) == bounding_box.bigEnd(dir)) && + (bc_type_lo != "Outflow" && bc_type_lo != "Open") && + (bc_type_hi != "Outflow" && bc_type_hi != "Open") ) + { + r[dir] = std::make_pair(FFT::Boundary::even,FFT::Boundary::even); + amrex::Print() << "SETTING " << dir << " TO EVEN EVEN " << std::endl; + } + + else if ( (lev_geom.Domain().smallEnd(dir) == bounding_box.smallEnd(dir)) && + (lev_geom.Domain().bigEnd(dir) == bounding_box.bigEnd(dir)) && + (bc_type_lo == "Outflow" || bc_type_lo == "Open") && + (bc_type_hi == "Outflow" || bc_type_hi == "Open") ) + { + r[dir] = std::make_pair(FFT::Boundary::odd,FFT::Boundary::odd); + amrex::Print() << "SETTING " << dir << " TO ODD ODD " << std::endl; + } + + else if ( (lev_geom.Domain().smallEnd(dir) == bounding_box.smallEnd(dir)) && + (bc_type_lo == "Outflow" || bc_type_lo == "Open") ) + { + r[dir] = std::make_pair(FFT::Boundary::odd,FFT::Boundary::even); + amrex::Print() << "SETTING " << dir << " TO ODD EVEN " << std::endl; + } + + else if ( (lev_geom.Domain().bigEnd(dir) == bounding_box.bigEnd(dir)) && + (bc_type_hi == "Outflow" || bc_type_hi == "Open") ) + { + r[dir] = std::make_pair(FFT::Boundary::even,FFT::Boundary::odd); + amrex::Print() << "SETTING " << dir << " TO EVEN ODD " << std::endl; + } + else + { + r[dir] = std::make_pair(FFT::Boundary::even,FFT::Boundary::even); + amrex::Print() << "SETTING " << dir << " TO EVEN EVEN " << std::endl; + } + } // dir + + // + // Always Neumann in the vertical + // + r[2] = std::make_pair(FFT::Boundary::even,FFT::Boundary::even); + + return r; +} +#endif +#endif diff --git a/Source/LinearSolvers/ERF_PoissonSolve.cpp b/Source/LinearSolvers/ERF_PoissonSolve.cpp index 0a80fe725..0e8db53a1 100644 --- a/Source/LinearSolvers/ERF_PoissonSolve.cpp +++ b/Source/LinearSolvers/ERF_PoissonSolve.cpp @@ -121,7 +121,8 @@ void ERF::project_velocities (int lev, Real l_dt, Vector& mom_mf, Mult #else #ifdef ERF_USE_FFT - bool boxes_make_rectangle = (geom_tmp[0].Domain().numPts() == ba_tmp[0].numPts()); + Box my_region(ba_tmp[0].minimalBox()); + bool boxes_make_rectangle = (my_region.numPts() == ba_tmp[0].numPts()); #endif // **************************************************************************** @@ -141,7 +142,7 @@ void ERF::project_velocities (int lev, Real l_dt, Vector& mom_mf, Mult } #else if (use_fft) { - amrex::Warning("use_fft can't be used unless you build with USE_FFT = TRUE; defaulting to MLMG"); + amrex::Warning("You set use_fft=true but didn't build with USE_FFT = TRUE; defaulting to MLMG"); } solve_with_mlmg(lev, rhs, phi, fluxes); #endif @@ -158,7 +159,7 @@ void ERF::project_velocities (int lev, Real l_dt, Vector& mom_mf, Mult amrex::Abort("FFT won't work unless the boxArray covers the domain"); } else { if (!use_fft) { - amrex::Warning("Using FFT even though you didn't set use_fft = 0; it's the best choice"); + amrex::Warning("Using FFT even though you didn't set use_fft to true; it's the best choice"); } solve_with_fft(lev, rhs[0], phi[0], fluxes[0]); } @@ -172,12 +173,12 @@ void ERF::project_velocities (int lev, Real l_dt, Vector& mom_mf, Mult #ifdef ERF_USE_FFT if (use_fft) { - amrex::Warning("FFT solver does not work for general terrain: switching to GMRES"); + amrex::Warning("FFT solver does not work for general terrain: switching to FFT-preconditioned GMRES"); } if (!boxes_make_rectangle) { amrex::Abort("FFT preconditioner for GMRES won't work unless the boxArray covers the domain"); } else { - solve_with_gmres(lev, rhs, phi, fluxes[0]); + solve_with_gmres(lev, rhs, phi, fluxes); } #else amrex::Abort("Rebuild with USE_FFT = TRUE so you can use the FFT preconditioner for GMRES"); diff --git a/Source/LinearSolvers/ERF_TerrainPoisson.H b/Source/LinearSolvers/ERF_TerrainPoisson.H index 40fdc95a1..97efd6afe 100644 --- a/Source/LinearSolvers/ERF_TerrainPoisson.H +++ b/Source/LinearSolvers/ERF_TerrainPoisson.H @@ -2,8 +2,9 @@ #define ERF_TERRAIN_POISSON_H_ #include "ERF_TerrainPoisson_3D_K.H" + #ifdef ERF_USE_FFT -#include "ERF_FFT_TerrainPrecond.H" +#include #endif #include @@ -17,7 +18,9 @@ public: TerrainPoisson (amrex::Geometry const& geom, amrex::BoxArray const& ba, amrex::DistributionMapping const& dm, - amrex::MultiFab const* z_phys_nd); + amrex::Gpu::DeviceVector& stretched_dz_lev_d, + amrex::MultiFab const* z_phys_nd, + amrex::Array& domain_bc_type); void apply(amrex::MultiFab& lhs, amrex::MultiFab const& rhs); @@ -51,9 +54,11 @@ private: amrex::Geometry m_geom; amrex::BoxArray m_grids; amrex::DistributionMapping m_dmap; + amrex::Gpu::DeviceVector m_stretched_dz_d; const amrex::MultiFab* m_zphys; + #ifdef ERF_USE_FFT - std::unique_ptr> m_2D_fft_precond; + std::unique_ptr> m_2D_fft_precond; #endif }; diff --git a/Source/LinearSolvers/ERF_TerrainPoisson.cpp b/Source/LinearSolvers/ERF_TerrainPoisson.cpp index 7e4b354fe..fd2214d27 100644 --- a/Source/LinearSolvers/ERF_TerrainPoisson.cpp +++ b/Source/LinearSolvers/ERF_TerrainPoisson.cpp @@ -1,28 +1,36 @@ #include "ERF_TerrainPoisson.H" +#include "ERF_FFT_Utils.H" using namespace amrex; TerrainPoisson::TerrainPoisson (Geometry const& geom, BoxArray const& ba, DistributionMapping const& dm, - MultiFab const* z_phys_nd) + Gpu::DeviceVector& stretched_dz_lev_d, + MultiFab const* z_phys_nd, + Array& domain_bc_type) : m_geom(geom), m_grids(ba), m_dmap(dm), + m_stretched_dz_d(stretched_dz_lev_d), m_zphys(z_phys_nd) { #ifdef ERF_USE_FFT if (!m_2D_fft_precond) { - m_2D_fft_precond = std::make_unique>(geom); + Box bounding_box = ba.minimalBox(); + auto bc_fft = get_fft_bc(geom,domain_bc_type,bounding_box); + m_2D_fft_precond = std::make_unique>(geom,bc_fft); } +#else + amrex::ignore_unused(domain_bc_type); #endif } -void TerrainPoisson::usePrecond(bool use_precond_in) +void TerrainPoisson::usePrecond (bool use_precond_in) { m_use_precond = use_precond_in; } -void TerrainPoisson::apply(MultiFab& lhs, MultiFab const& rhs) +void TerrainPoisson::apply (MultiFab& lhs, MultiFab const& rhs) { AMREX_ASSERT(rhs.nGrowVect().allGT(0)); @@ -90,12 +98,12 @@ void TerrainPoisson::apply(MultiFab& lhs, MultiFab const& rhs) auto const& xc = xx.const_arrays(); ParallelFor(rhs, [=] AMREX_GPU_DEVICE (int b, int i, int j, int k) { - terrpoisson_adotx(i,j,k,y[b], xc[b], zpa[b], dxinv[0], dxinv[1]); + terrpoisson_adotx(i, j, k, y[b], xc[b], zpa[b], dxinv[0], dxinv[1]); }); } -void TerrainPoisson::getFluxes(MultiFab& phi, - Array& fluxes) +void TerrainPoisson::getFluxes (MultiFab& phi, + Array& fluxes) { auto const& dxinv = m_geom.InvCellSizeArray(); @@ -144,53 +152,92 @@ void TerrainPoisson::getFluxes(MultiFab& phi, }); } -void TerrainPoisson::assign(MultiFab& lhs, MultiFab const& rhs) +void TerrainPoisson::assign (MultiFab& lhs, MultiFab const& rhs) { MultiFab::Copy(lhs, rhs, 0, 0, 1, 0); } -void TerrainPoisson::scale(MultiFab& lhs, Real fac) +void TerrainPoisson::scale (MultiFab& lhs, Real fac) { lhs.mult(fac); } -Real TerrainPoisson::dotProduct(MultiFab const& v1, MultiFab const& v2) +Real TerrainPoisson::dotProduct (MultiFab const& v1, MultiFab const& v2) { return MultiFab::Dot(v1, 0, v2, 0, 1, 0); } -void TerrainPoisson::increment(MultiFab& lhs, MultiFab const& rhs, Real a) +void TerrainPoisson::increment (MultiFab& lhs, MultiFab const& rhs, Real a) { MultiFab::Saxpy(lhs, a, rhs, 0, 0, 1, 0); } -void TerrainPoisson::linComb(MultiFab& lhs, Real a, MultiFab const& rhs_a, - Real b, MultiFab const& rhs_b) +void TerrainPoisson::linComb (MultiFab& lhs, Real a, MultiFab const& rhs_a, + Real b, MultiFab const& rhs_b) { MultiFab::LinComb(lhs, a, rhs_a, 0, b, rhs_b, 0, 0, 1, 0); } -MultiFab TerrainPoisson::makeVecRHS() +MultiFab TerrainPoisson::makeVecRHS () { return MultiFab(m_grids, m_dmap, 1, 0); } -MultiFab TerrainPoisson::makeVecLHS() +MultiFab TerrainPoisson::makeVecLHS () { return MultiFab(m_grids, m_dmap, 1, 1); } -Real TerrainPoisson::norm2(MultiFab const& v) +Real TerrainPoisson::norm2 (MultiFab const& v) { return v.norm2(); } -void TerrainPoisson::precond(MultiFab& lhs, MultiFab const& rhs) +void TerrainPoisson::precond (MultiFab& lhs, MultiFab const& rhs) { #ifdef ERF_USE_FFT - if (m_use_precond) { - m_2D_fft_precond->solve(lhs, rhs, *m_zphys); + if (m_use_precond) + { + amrex::Print() << "Using the hybrid FFT solver as a preconditioner..." << std::endl; + + // Make a version that isn't constant + MultiFab& rhs_tmp = const_cast(rhs); + + lhs.setVal(0.); + m_2D_fft_precond->solve(lhs, rhs_tmp, m_stretched_dz_d); +#if 0 + AMREX_ASSERT(m_zphys_fft.local_size() <= 1); + FArrayBox const* zfab = nullptr; + if (m_zphys_fft.local_size() == 1) { + zfab = m_zphys_fft.fabPtr(m_zphys_fft.IndexArray()[0]); + } + auto za = zfab ? zfab->const_array() : Array4{}; + auto dxinv = m_geom.InvCellSize(0); + auto dyinv = m_geom.InvCellSize(1); + m_2D_fft_precond->solve(lhs, rhs, + [=] AMREX_GPU_DEVICE (int ii, int jj, int k) -> Real + { + int i = 0; int j = 0; + Real hzeta_inv_on_cc = Real(4.0) / ( (za(i,j,k+1) + za(i+1,j,k+1) + za(i,j+1,k+1) + za(i+1,j+1,k+1)) + -(za(i,j,k ) + za(i+1,j,k ) + za(i,j+1,k ) + za(i+1,j+1,k )) ); + eal hzeta_inv_on_zlo = Real(8.0) / ( (za(i,j,k+1) + za(i+1,j,k+1) + za(i,j+1,k+1) + za(i+1,j+1,k+1)) + -(za(i,j,k-1) + za(i+1,j,k-1) + za(i,j+1,k-1) + za(i+1,j+1,k-1)) ); + Real h_xi_on_zlo = Real(0.5) * (za(i+1,j+1,k ) + za(i+1,j,k ) - za(i,j+1,k ) - za(i,j,k )) * dxinv; + Real h_eta_on_zlo = Real(0.5) * (za(i+1,j+1,k ) + za(i,j+1,k ) - za(i+1,j,k ) - za(i,j,k )) * dyinv; + return hzeta_inv_on_cc * (Real(1.0) + h_xi_on_zlo*h_xi_on_zlo + h_eta_on_zlo*h_eta_on_zlo) * hzeta_inv_on_zlo; + }, + [=] AMREX_GPU_DEVICE (int ii, int jj, int k) -> Real + { + Real hzeta_inv_on_cc = Real(4.0) / ( (za(i,j,k+1) + za(i+1,j,k+1) + za(i,j+1,k+1) + za(i+1,j+1,k+1)) + -(za(i,j,k ) + za(i+1,j,k ) + za(i,j+1,k ) + za(i+1,j+1,k )) ); + Real hzeta_inv_on_zhi = Real(8.0) / ( (za(i,j,k+2) + za(i+1,j,k+2) + za(i,j+1,k+2) + za(i+1,j+1,k+2)) + -(za(i,j,k ) + za(i+1,j,k ) + za(i,j+1,k ) + za(i+1,j+1,k )) ); + Real h_xi_on_zhi = Real(0.5) * (za(i+1,j+1,k+1) + za(i+1,j,k+1) - za(i,j+1,k+1) - za(i,j,k+1)) * dxinv; + Real h_eta_on_zhi = Real(0.5) * (za(i+1,j+1,k+1) + za(i,j+1,k+1) - za(i+1,j,k+1) - za(i,j,k+1)) * dyinv; + return hzeta_inv_on_cc * (Real(1.0) + h_xi_on_zhi*h_xi_on_zhi + h_eta_on_zhi*h_eta_on_zhi) * hzeta_inv_on_zhi; + }); +#endif } else #endif { diff --git a/Source/LinearSolvers/ERF_solve_with_fft.cpp b/Source/LinearSolvers/ERF_solve_with_fft.cpp index 291cacad4..2e268dd96 100644 --- a/Source/LinearSolvers/ERF_solve_with_fft.cpp +++ b/Source/LinearSolvers/ERF_solve_with_fft.cpp @@ -1,47 +1,9 @@ #include "ERF.H" -#include "ERF_Utils.H" +#include "ERF_FFT_Utils.H" using namespace amrex; #ifdef ERF_USE_FFT -Array,AMREX_SPACEDIM> -ERF::get_fft_bc () const noexcept -{ - // - // This logic only works for level 0 - // TODO: fix for level > 0 - // - Array,AMREX_SPACEDIM> r; - - for (int dir = 0; dir <= 1; dir++) { - if (geom[0].isPeriodic(dir)) { - r[dir] = std::make_pair(FFT::Boundary::periodic,FFT::Boundary::periodic); - } - } // dir - - for (OrientationIter ori; ori != nullptr; ++ori) { - const int dir = ori().coordDir(); - if (!geom[0].isPeriodic(dir) && ori().faceDir() == Orientation::low) { - auto bc_type_lo = domain_bc_type[Orientation(dir,Orientation::low)]; - auto bc_type_hi = domain_bc_type[Orientation(dir,Orientation::high)]; - if ( (bc_type_lo == "Outflow" || bc_type_lo == "Open") && - (bc_type_hi == "Outflow" || bc_type_hi == "Open") ) { - r[dir] = std::make_pair(FFT::Boundary::odd,FFT::Boundary::odd); - } else if ( (bc_type_lo != "Outflow" && bc_type_lo != "Open") && - (bc_type_hi == "Outflow" || bc_type_hi == "Outflow") ) { - r[dir] = std::make_pair(FFT::Boundary::even,FFT::Boundary::odd); - } else if ( (bc_type_lo == "Outflow" || bc_type_lo == "Open") && - (bc_type_hi != "Outflow" && bc_type_hi != "Outflow") ) { - r[dir] = std::make_pair(FFT::Boundary::odd,FFT::Boundary::even); - } else { - r[dir] = std::make_pair(FFT::Boundary::even,FFT::Boundary::even); - } - } // not periodic - } // ori - - return r; -} - /** * Solve the Poisson equation using FFT * Note that the level may or may not be level 0. @@ -50,30 +12,22 @@ void ERF::solve_with_fft (int lev, MultiFab& rhs, MultiFab& phi, Array 0 - AMREX_ALWAYS_ASSERT(lev == 0); - bool l_use_terrain = SolverChoice::terrain_type != TerrainType::None; auto const dom_lo = lbound(geom[lev].Domain()); auto const dom_hi = ubound(geom[lev].Domain()); - auto bclo = get_projection_bc(Orientation::low); - auto bchi = get_projection_bc(Orientation::high); - - // amrex::Print() << "BCLO " << bclo[0] << " " << bclo[1] << " " << bclo[2] << std::endl; - // amrex::Print() << "BCHI " << bchi[0] << " " << bchi[1] << " " << bchi[2] << std::endl; - auto dxInv = geom[lev].InvCellSizeArray(); Real reltol = solverChoice.poisson_reltol; Real abstol = solverChoice.poisson_abstol; + Box bounding_box(rhs.boxArray().minimalBox()); + auto bc_fft = get_fft_bc(geom[lev],domain_bc_type,bounding_box); + // **************************************************************************** // FFT solve // **************************************************************************** - AMREX_ALWAYS_ASSERT(lev == 0); // // No terrain or stretched grids // This calls the full 3D FFT solver with bc's set through bc_fft @@ -83,30 +37,28 @@ void ERF::solve_with_fft (int lev, MultiFab& rhs, MultiFab& phi, Array 0) { amrex::Print() << "Using the 3D FFT solver..." << std::endl; } - if (!m_3D_poisson) { - auto bc_fft = get_fft_bc(); - m_3D_poisson = std::make_unique>(Geom(0),bc_fft); + if (m_3D_poisson.size() <= lev) { + m_3D_poisson.resize(lev+1); + m_3D_poisson[lev] = std::make_unique>(Geom(lev),bc_fft); } - m_3D_poisson->solve(phi, rhs); + m_3D_poisson[lev]->solve(phi, rhs); // // Stretched grids - // This calls the hybrid 2D FFT solver + tridiagonal in z - // - // For right now we can only do this solve for periodic in the x- and y-directions - // We assume Neumann at top and bottom z-boundaries - // This will be generalized in future // + // This calls the hybrid 2D FFT solver + tridiagonal in z with lateral bc's set through bc_fft + // and Neumann at top and bottom z-boundaries // } else if (l_use_terrain && SolverChoice::terrain_is_flat) { if (mg_verbose > 0) { amrex::Print() << "Using the hybrid FFT solver..." << std::endl; } - if (!m_2D_poisson) { - m_2D_poisson = std::make_unique>(Geom(0)); + if (m_2D_poisson.size() <= lev) { + m_2D_poisson.resize(lev+1); + m_2D_poisson[lev] = std::make_unique>(Geom(lev),bc_fft); } - m_2D_poisson->solve(phi, rhs, stretched_dz_d[lev]); + m_2D_poisson[lev]->solve(phi, rhs, stretched_dz_d[lev]); } else { amrex::Abort("FFT isn't appropriate for spatially varying terrain"); diff --git a/Source/LinearSolvers/ERF_solve_with_gmres.cpp b/Source/LinearSolvers/ERF_solve_with_gmres.cpp index d4ef6214e..9c05aaac0 100644 --- a/Source/LinearSolvers/ERF_solve_with_gmres.cpp +++ b/Source/LinearSolvers/ERF_solve_with_gmres.cpp @@ -9,7 +9,8 @@ using namespace amrex; /** * Solve the Poisson equation using GMRES */ -void ERF::solve_with_gmres (int lev, Vector& rhs, Vector& phi, Array& fluxes) +void ERF::solve_with_gmres (int lev, Vector& rhs, Vector& phi, + Vector>& fluxes) { BL_PROFILE("ERF::solve_with_gmres()"); @@ -18,7 +19,8 @@ void ERF::solve_with_gmres (int lev, Vector& rhs, Vector& ph amrex::GMRES gmsolver; - TerrainPoisson tp(geom[lev], rhs[lev].boxArray(), rhs[lev].DistributionMap(), z_phys_nd[lev].get()); + TerrainPoisson tp(geom[lev], rhs[0].boxArray(), rhs[0].DistributionMap(), stretched_dz_d[lev], + z_phys_nd[lev].get(), domain_bc_type); gmsolver.define(tp); @@ -28,5 +30,5 @@ void ERF::solve_with_gmres (int lev, Vector& rhs, Vector& ph gmsolver.solve(phi[0], rhs[0], reltol, abstol); - tp.getFluxes(phi[0], fluxes); + tp.getFluxes(phi[0], fluxes[0]); } diff --git a/Source/LinearSolvers/Make.package b/Source/LinearSolvers/Make.package index 7f25cdfca..55045c5f8 100644 --- a/Source/LinearSolvers/Make.package +++ b/Source/LinearSolvers/Make.package @@ -5,12 +5,12 @@ CEXE_sources += ERF_TerrainPoisson.cpp CEXE_sources += ERF_compute_divergence.cpp CEXE_sources += ERF_PoissonSolve.cpp CEXE_sources += ERF_PoissonSolve_tb.cpp -CEXE_sources += ERF_solve_with_fft.cpp CEXE_sources += ERF_solve_with_gmres.cpp CEXE_sources += ERF_solve_with_mlmg.cpp ifeq ($(USE_FFT), TRUE) -CEXE_headers += ERF_FFT_TerrainPrecond.H +CEXE_headers += ERF_FFT_Utils.H +CEXE_sources += ERF_solve_with_fft.cpp endif ifeq ($(USE_EB), TRUE)