From aa2c754822da42c4e4c6033b5415a019b5524c81 Mon Sep 17 00:00:00 2001 From: John Omotani Date: Fri, 6 Dec 2024 12:55:18 +0000 Subject: [PATCH 01/23] Add LU preconditioner to electron_implicit_advance!() `electron_implicit_advance!()` attempts to solve for the steady-state g_e and backward-Euler p_e|| in a single Newton-Krylov solve. Adding an LU preconditioner might give it a chance of converging! --- .../src/electron_kinetic_equation.jl | 208 +++++++++++++++--- moment_kinetics/src/time_advance.jl | 37 +++- 2 files changed, 204 insertions(+), 41 deletions(-) diff --git a/moment_kinetics/src/electron_kinetic_equation.jl b/moment_kinetics/src/electron_kinetic_equation.jl index 2bf8685a1..8af3c0e06 100644 --- a/moment_kinetics/src/electron_kinetic_equation.jl +++ b/moment_kinetics/src/electron_kinetic_equation.jl @@ -1880,21 +1880,146 @@ to allow the outer r-loop to be parallelised. newton_success = false for ir ∈ 1:r.n + if nl_solver_params.preconditioner_type === Val(:electron_lu) + + if ion_dt > 1.5 * nl_solver_params.precon_dt[] || + ion_dt < 2.0/3.0 * nl_solver_params.precon_dt[] + + # dt has changed significantly, so update the preconditioner + nl_solver_params.solves_since_precon_update[] = nl_solver_params.preconditioner_update_interval + end + + if nl_solver_params.solves_since_precon_update[] ≥ nl_solver_params.preconditioner_update_interval +global_rank[] == 0 && println("recalculating precon") + nl_solver_params.solves_since_precon_update[] = 0 + nl_solver_params.precon_dt[] = ion_dt + + orig_lu, precon_matrix, input_buffer, output_buffer = + nl_solver_params.preconditioners[ir] + + fill_electron_kinetic_equation_Jacobian!( + precon_matrix, f_electron, ppar, moments, phi, collisions, + composition, z, vperp, vpa, z_spectral, vperp_spectral, vpa_spectral, + z_advect, vpa_advect, scratch_dummy, external_source_settings, + num_diss_params, t_params, ion_dt, ir, true, :all, true, false) + + begin_serial_region() + if block_rank[] == 0 + if size(orig_lu) == (1, 1) + # Have not properly created the LU decomposition before, so + # cannot reuse it. + @timeit_debug global_timer "lu" nl_solver_params.preconditioners[ir] = + (lu(sparse(precon_matrix)), precon_matrix, input_buffer, + output_buffer) + else + # LU decomposition was previously created. The Jacobian always + # has the same sparsity pattern, so by using `lu!()` we can + # reuse some setup. + try + @timeit_debug global_timer "lu!" lu!(orig_lu, sparse(precon_matrix); check=false) + catch e + if !isa(e, ArgumentError) + rethrow(e) + end + println("Sparsity pattern of matrix changed, rebuilding " + * " LU from scratch") + @timeit_debug global_timer "lu" orig_lu = lu(sparse(precon_matrix)) + end + nl_solver_params.preconditioners[ir] = + (orig_lu, precon_matrix, input_buffer, output_buffer) + end + else + nl_solver_params.preconditioners[ir] = + (orig_lu, precon_matrix, input_buffer, output_buffer) + end + end + + @timeit_debug global_timer lu_precon!(x) = begin + precon_ppar, precon_f = x + + precon_lu, _, this_input_buffer, this_output_buffer = + nl_solver_params.preconditioners[ir] + + begin_serial_region() + counter = 1 + @loop_z_vperp_vpa iz ivperp ivpa begin + this_input_buffer[counter] = precon_f[ivpa,ivperp,iz] + counter += 1 + end + @loop_z iz begin + this_input_buffer[counter] = precon_ppar[iz] + counter += 1 + end + + begin_serial_region() + @serial_region begin + @timeit_debug global_timer "ldiv!" ldiv!(this_output_buffer, precon_lu, this_input_buffer) + end + + begin_serial_region() + counter = 1 + @loop_z_vperp_vpa iz ivperp ivpa begin + precon_f[ivpa,ivperp,iz] = this_output_buffer[counter] + counter += 1 + end + @loop_z iz begin + precon_ppar[iz] = this_output_buffer[counter] + counter += 1 + end + + # Ensure values of precon_f and precon_ppar are consistent across + # distributed-MPI block boundaries. For precon_f take the upwind + # value, and for precon_ppar take the average. + f_lower_endpoints = @view scratch_dummy.buffer_vpavperpr_1[:,:,ir] + f_upper_endpoints = @view scratch_dummy.buffer_vpavperpr_2[:,:,ir] + receive_buffer1 = @view scratch_dummy.buffer_vpavperpr_3[:,:,ir] + receive_buffer2 = @view scratch_dummy.buffer_vpavperpr_4[:,:,ir] + begin_vperp_vpa_region() + @loop_vperp_vpa ivperp ivpa begin + f_lower_endpoints[ivpa,ivperp] = precon_f[ivpa,ivperp,1] + f_upper_endpoints[ivpa,ivperp] = precon_f[ivpa,ivperp,end] + end + # We upwind the z-derivatives in `electron_z_advection!()`, so would + # expect that upwinding the results here in z would make sense. + # However, upwinding here makes convergence much slower (~10x), + # compared to picking the values from one side or other of the block + # boundary, or taking the average of the values on either side. + # Neither direction is special, so taking the average seems most + # sensible (although in an intial test it does not seem to converge + # faster than just picking one or the other). + # Maybe this could indicate that it is more important to have a fully + # self-consistent Jacobian inversion for the + # `electron_vpa_advection()` part rather than taking half(ish) of the + # values from one block and the other half(ish) from the other. + reconcile_element_boundaries_MPI_z_pdf_vpavperpz!( + precon_f, f_lower_endpoints, f_upper_endpoints, receive_buffer1, + receive_buffer2, z) + + begin_serial_region() + @serial_region begin + buffer_1[] = precon_ppar[1] + buffer_2[] = precon_ppar[end] + end + reconcile_element_boundaries_MPI!( + precon_ppar, buffer_1, buffer_2, buffer_3, buffer_4, z) + + return nothing + end + + left_preconditioner = identity + right_preconditioner = lu_precon! + elseif nl_solver_params.preconditioner_type === Val(:none) + left_preconditioner = identity + right_preconditioner = identity + else + error("preconditioner_type=$(nl_solver_params.preconditioner_type) is not " + * "supported by electron_backward_euler!().") + end + function residual_func!(residual, new_variables; debug=false, krylov=false) electron_ppar_residual, f_electron_residual = residual electron_ppar_new, f_electron_new = new_variables - apply_electron_bc_and_constraints_no_r!(f_electron_new, fields.phi, moments, - z, vperp, vpa, vperp_spectral, - vpa_spectral, vpa_advect, - num_diss_params, composition, ir) - - # Calculate heat flux and derivatives using new_variables - @views calculate_electron_qpar_from_pdf_no_r!(moments.electron.qpar[:,ir], - electron_ppar_new, - moments.electron.vth[:,ir], - f_electron_new, vpa, ir) - this_dens = moments.electron.dens this_upar = moments.electron.upar this_vth = moments.electron.vth @@ -1906,6 +2031,23 @@ to allow the outer r-loop to be parallelised. (this_dens[iz,ir] * composition.me_over_mi))) end + + # enforce the boundary condition(s) on the electron pdf + @views enforce_boundary_condition_on_electron_pdf!( + f_electron_new, phi, moments.electron.vth[:,ir], + moments.electron.upar[:,ir], z, vperp, vpa, vperp_spectral, + vpa_spectral, vpa_advect, moments, + num_diss_params.electron.vpa_dissipation_coefficient > 0.0, + composition.me_over_mi, ir; bc_constraints=false, + update_vcut=!krylov) + + # Calculate heat flux and derivatives using new_variables + @views calculate_electron_qpar_from_pdf_no_r!(moments.electron.qpar[:,ir], + electron_ppar_new, + moments.electron.vth[:,ir], + f_electron_new, vpa, ir) + + calculate_electron_moment_derivatives_no_r!( moments, (electron_density=this_dens, @@ -1937,10 +2079,8 @@ to allow the outer r-loop to be parallelised. f_electron_residual, electron_ppar_residual, f_electron_new, electron_ppar_new, moments, z, vperp, vpa, z_spectral, vpa_spectral, z_advect, vpa_advect, scratch_dummy, collisions, composition, external_source_settings, - num_diss_params, t_params, ir; soft_force_constraints=true) - @loop_z_vperp_vpa iz ivperp ivpa begin - f_electron_residual[ivpa,ivperp,iz] /= sqrt(1.0 + vpa.grid[ivpa]^2) - end + num_diss_params, t_params, ir; evolve_ppar=true, ion_dt=ion_dt, + soft_force_constraints=true) # Set residual to zero where pdf_electron is determined by boundary conditions. if vpa.n > 1 @@ -1972,13 +2112,12 @@ to allow the outer r-loop to be parallelised. w = (scratch_dummy.implicit_buffer_z_5, scratch_dummy.implicit_buffer_vpavperpz_5) - @views newton_success = newton_solve!((electron_ppar_out[:,ir], - pdf_electron_out[:,:,:,ir]), - residual_func!, residual, delta_x, - rhs_delta, v, w, nl_solver_params; - left_preconditioner=nothing, - right_preconditioner=nothing, - coords=(z=z, vperp=vperp, vpa=vpa)) + newton_success = newton_solve!((ppar, f_electron), residual_func!, residual, + delta_x, rhs_delta, v, w, nl_solver_params; + left_preconditioner=nothing, + right_preconditioner=nothing, + recalculate_preconditioner=recalculate_preconditioner!, + coords=(z=z, vperp=vperp, vpa=vpa)) if !newton_success break end @@ -4463,7 +4602,8 @@ end collisions, composition, external_source_settings, num_diss_params, t_params, ir; - evolve_ppar=false, ion_dt=nothing) + evolve_ppar=false, ion_dt=nothing, + soft_force_constraints=false) Do a forward-Euler update of the electron kinetic equation. @@ -4562,14 +4702,20 @@ end Fill a pre-allocated matrix with the Jacobian matrix for electron kinetic equation and (if `evolve_ppar=true`) the electron energy equation. + +`add_identity=false` can be passed to skip adding 1's on the diagonal. Doing this would +produce the Jacobian for a steady-state solve, rather than a backward-Euler timestep +solve. [Note that rows representing boundary points still need the 1 added to their +diagonal, as that 1 is used to impose the boundary condition, not to represent the 'new f' +in the time derivative term as it is for the non-boundary points.] """ @timeit global_timer fill_electron_kinetic_equation_Jacobian!( jacobian_matrix, f, ppar, moments, phi_global, collisions, composition, z, vperp, vpa, z_spectral, vperp_spectral, vpa_spectral, z_advect, vpa_advect, scratch_dummy, external_source_settings, num_diss_params, t_params, ion_dt, ir, - evolve_ppar, include=:all, - include_qpar_integral_terms=true) = begin + evolve_ppar, include=:all, include_qpar_integral_terms=true, + add_identity=true) = begin dt = t_params.dt[] buffer_1 = @view scratch_dummy.buffer_rs_1[ir,1] @@ -4604,6 +4750,8 @@ Fill a pre-allocated matrix with the Jacobian matrix for electron kinetic equati pdf_size = z.n * vperp.n * vpa.n v_size = vperp.n * vpa.n + z_speed = @view z_advect[1].speed[:,:,:,ir] + # Initialise jacobian_matrix to the identity begin_z_vperp_vpa_region() @loop_z_vperp_vpa iz ivperp ivpa begin @@ -4611,7 +4759,11 @@ Fill a pre-allocated matrix with the Jacobian matrix for electron kinetic equati row = (iz - 1) * v_size + (ivperp - 1) * vpa.n + ivpa jacobian_matrix[row,:] .= 0.0 - if include === :all + if (include === :all + && (add_identity + || skip_f_electron_bc_points_in_Jacobian(iz, ivperp, ivpa, z, vperp, vpa, + z_speed)) + ) jacobian_matrix[row,row] += 1.0 end end @@ -4621,13 +4773,11 @@ Fill a pre-allocated matrix with the Jacobian matrix for electron kinetic equati row = pdf_size + iz jacobian_matrix[row,:] .= 0.0 - if include === :all + if include === :all && add_identity jacobian_matrix[row,row] += 1.0 end end - z_speed = @view z_advect[1].speed[:,:,:,ir] - if include ∈ (:all, :explicit_v) dpdf_dz = @view scratch_dummy.buffer_vpavperpzr_1[:,:,:,ir] begin_vperp_vpa_region() diff --git a/moment_kinetics/src/time_advance.jl b/moment_kinetics/src/time_advance.jl index 374262198..2c5704935 100644 --- a/moment_kinetics/src/time_advance.jl +++ b/moment_kinetics/src/time_advance.jl @@ -425,6 +425,7 @@ function setup_time_info(t_input, n_variables, code_time, dt_reload, end implicit_electron_ppar = false + implicit_electron_advance = false electron_preconditioner_type = nothing decrease_dt_iteration_threshold = t_input["decrease_dt_iteration_threshold"] increase_dt_iteration_threshold = t_input["increase_dt_iteration_threshold"] @@ -436,6 +437,7 @@ function setup_time_info(t_input, n_variables, code_time, dt_reload, elseif electron === false debug_io = nothing implicit_electron_ppar = false + implicit_electron_advance = false electron_preconditioner_type = nothing decrease_dt_iteration_threshold = -1 increase_dt_iteration_threshold = typemax(mk_int) @@ -448,6 +450,7 @@ function setup_time_info(t_input, n_variables, code_time, dt_reload, debug_io = nothing implicit_electron_ppar = (t_input["implicit_electron_ppar"] !== false) + implicit_electron_advance = (t_input["implicit_electron_advance"] !== false) if implicit_electron_ppar if t_input["implicit_electron_ppar"] === true if block_size[] == 1 @@ -469,6 +472,12 @@ function setup_time_info(t_input, n_variables, code_time, dt_reload, * "preconditioner to use - one of $precon_keys.") end end + elseif implicit_electron_advance + if t_input["implicit_electron_advance"] !== true + error("No options other than `true` supported yet for " + * "implicit_electron_advance.") + end + electron_preconditioner_type = Val(:electron_lu) else electron_preconditioner_type = Val(:none) end @@ -498,11 +507,10 @@ function setup_time_info(t_input, n_variables, code_time, dt_reload, mk_float(t_input["last_fail_proximity_factor"]), mk_float(t_input["minimum_dt"]), mk_float(t_input["maximum_dt"]), electron !== nothing && t_input["implicit_braginskii_conduction"], - electron !== nothing && t_input["implicit_electron_advance"], + implicit_electron_advance, electron !== nothing && t_input["implicit_ion_advance"], electron !== nothing && t_input["implicit_vpa_advection"], - electron !== nothing && implicit_electron_ppar, - electron_preconditioner_type, + implicit_electron_ppar, electron_preconditioner_type, mk_float(t_input["constraint_forcing_rate"]), decrease_dt_iteration_threshold, increase_dt_iteration_threshold, mk_float(cap_factor_ion_dt), mk_int(max_pseudotimesteps), @@ -3578,15 +3586,20 @@ end neutral_z_advect, neutral_r_advect, neutral_vz_advect = advect_objects.neutral_z_advect, advect_objects.neutral_r_advect, advect_objects.neutral_vz_advect if t_params.implicit_electron_advance - success = implicit_electron_advance!(fvec_out, fvec_in, pdf, scratch_electron, - moments, fields, collisions, composition, - geometry, external_source_settings, - num_diss_params, r, z, vperp, vpa, - r_spectral, z_spectral, vperp_spectral, - vpa_spectral, electron_z_advect, - electron_vpa_advect, gyroavs, scratch_dummy, - t_params.electron, t_params.dt[], - nl_solver_params.electron_advance) + electron_success = implicit_electron_advance!(fvec_out, fvec_in, pdf, + scratch_electron, moments, fields, + collisions, composition, geometry, + external_source_settings, + num_diss_params, r, z, vperp, vpa, + r_spectral, z_spectral, + vperp_spectral, vpa_spectral, + electron_z_advect, + electron_vpa_advect, gyroavs, + scratch_dummy, t_params.electron, + dt, + nl_solver_params.electron_advance) + + success = (electron_success == "") elseif t_params.implicit_electron_ppar max_electron_pdf_iterations = t_params.electron.max_pseudotimesteps max_electron_sim_time = t_params.electron.max_pseudotime From 0e8bf153573170763dbfb51af764ea6f813ce445 Mon Sep 17 00:00:00 2001 From: John Omotani Date: Fri, 6 Dec 2024 21:16:19 +0000 Subject: [PATCH 02/23] Recalculate the preconditioner if number of Newton iterations gets large When number of Newton iterations reaches (multiples of) the `preconditioner_update_interval`, assume convergence is getting slow and recalculate the preconditioner. --- .../src/electron_kinetic_equation.jl | 29 +++++++++++++------ moment_kinetics/src/nonlinear_solvers.jl | 16 ++++++++-- 2 files changed, 33 insertions(+), 12 deletions(-) diff --git a/moment_kinetics/src/electron_kinetic_equation.jl b/moment_kinetics/src/electron_kinetic_equation.jl index 8af3c0e06..1852d0321 100644 --- a/moment_kinetics/src/electron_kinetic_equation.jl +++ b/moment_kinetics/src/electron_kinetic_equation.jl @@ -1880,16 +1880,12 @@ to allow the outer r-loop to be parallelised. newton_success = false for ir ∈ 1:r.n - if nl_solver_params.preconditioner_type === Val(:electron_lu) - - if ion_dt > 1.5 * nl_solver_params.precon_dt[] || - ion_dt < 2.0/3.0 * nl_solver_params.precon_dt[] - - # dt has changed significantly, so update the preconditioner - nl_solver_params.solves_since_precon_update[] = nl_solver_params.preconditioner_update_interval - end + f_electron = @view pdf_electron_out[:,:,:,ir] + ppar = @view electron_ppar_out[:,ir] + phi = @view fields.phi[:,ir] - if nl_solver_params.solves_since_precon_update[] ≥ nl_solver_params.preconditioner_update_interval + function recalculate_preconditioner!() + if nl_solver_params.preconditioner_type === Val(:electron_lu) global_rank[] == 0 && println("recalculating precon") nl_solver_params.solves_since_precon_update[] = 0 nl_solver_params.precon_dt[] = ion_dt @@ -1932,6 +1928,21 @@ global_rank[] == 0 && println("recalculating precon") nl_solver_params.preconditioners[ir] = (orig_lu, precon_matrix, input_buffer, output_buffer) end + + return nothing + end + end + + if nl_solver_params.preconditioner_type === Val(:electron_lu) + if ion_dt > 1.5 * nl_solver_params.precon_dt[] || + ion_dt < 2.0/3.0 * nl_solver_params.precon_dt[] + + # dt has changed significantly, so update the preconditioner + nl_solver_params.solves_since_precon_update[] = nl_solver_params.preconditioner_update_interval + end + + if nl_solver_params.solves_since_precon_update[] ≥ nl_solver_params.preconditioner_update_interval + recalculate_preconditioner!() end @timeit_debug global_timer lu_precon!(x) = begin diff --git a/moment_kinetics/src/nonlinear_solvers.jl b/moment_kinetics/src/nonlinear_solvers.jl index aeeb43436..7ba24ea37 100644 --- a/moment_kinetics/src/nonlinear_solvers.jl +++ b/moment_kinetics/src/nonlinear_solvers.jl @@ -393,17 +393,21 @@ is not necessary to have a very tight `linear_rtol` for the GMRES solve. @timeit global_timer newton_solve!( x, residual_func!, residual, delta_x, rhs_delta, v, w, nl_solver_params; left_preconditioner=nothing, - right_preconditioner=nothing, coords) = begin + right_preconditioner=nothing, recalculate_preconditioner=nothing, + coords) = begin # This wrapper function constructs the `solver_type` from coords, so that the body of # the inner `newton_solve!()` can be fully type-stable solver_type = Val(Symbol((c for c ∈ keys(coords))...)) return newton_solve!(x, residual_func!, residual, delta_x, rhs_delta, v, w, nl_solver_params, solver_type; left_preconditioner=left_preconditioner, - right_preconditioner=right_preconditioner, coords=coords) + right_preconditioner=right_preconditioner, + recalculate_preconditioner=recalculate_preconditioner, + coords=coords) end function newton_solve!(x, residual_func!, residual, delta_x, rhs_delta, v, w, nl_solver_params, solver_type::Val; left_preconditioner=nothing, - right_preconditioner=nothing, coords) + right_preconditioner=nothing, recalculate_preconditioner=nothing, + coords) rtol = nl_solver_params.rtol atol = nl_solver_params.atol @@ -512,6 +516,12 @@ old_precon_iterations = nl_solver_params.precon_iterations[] parallel_map(solver_type, (w) -> w, x, w) previous_residual_norm = residual_norm + if recalculate_preconditioner !== nothing && counter % nl_solver_params.preconditioner_update_interval == 0 + # Have taken a large number of Newton iterations already - convergence must be + # slow, so try updating the preconditioner. + recalculate_preconditioner() + end + #println("Newton residual ", residual_norm, " ", linear_its, " $rtol $atol") if residual_norm < 0.1/rtol && close_counter < 0 && close_linear_counter < 0 From f338aa9d103cde125ef6803cf4908e990c756ee9 Mon Sep 17 00:00:00 2001 From: John Omotani Date: Sat, 7 Dec 2024 17:15:31 +0000 Subject: [PATCH 03/23] Refactor single electron backward euler step into separate function ...renaming the function that executes a pseudotimestepping loop with several `electron_backward_euler!()` calls to `electron_backward_euler_pseudotimestepping!()`. --- .../src/electron_kinetic_equation.jl | 1719 +++++++++-------- 1 file changed, 891 insertions(+), 828 deletions(-) diff --git a/moment_kinetics/src/electron_kinetic_equation.jl b/moment_kinetics/src/electron_kinetic_equation.jl index 1852d0321..96fed0d93 100644 --- a/moment_kinetics/src/electron_kinetic_equation.jl +++ b/moment_kinetics/src/electron_kinetic_equation.jl @@ -124,12 +124,13 @@ OUTPUT: max_electron_sim_time; io_electron=io_electron, initial_time=initial_time, residual_tolerance=residual_tolerance, evolve_ppar=evolve_ppar, ion_dt=ion_dt) elseif solution_method == "backward_euler" - return electron_backward_euler!(scratch, pdf, moments, phi, collisions, - composition, r, z, vperp, vpa, z_spectral, vperp_spectral, vpa_spectral, - z_advect, vpa_advect, scratch_dummy, t_params, external_source_settings, - num_diss_params, nl_solver_params, max_electron_pdf_iterations, - max_electron_sim_time; io_electron=io_electron, initial_time=initial_time, - residual_tolerance=residual_tolerance, evolve_ppar=evolve_ppar, ion_dt=ion_dt) + return electron_backward_euler_pseudotimestepping!(scratch, pdf, moments, phi, + collisions, composition, r, z, vperp, vpa, z_spectral, vperp_spectral, + vpa_spectral, z_advect, vpa_advect, scratch_dummy, t_params, + external_source_settings, num_diss_params, nl_solver_params, + max_electron_pdf_iterations, max_electron_sim_time; io_electron=io_electron, + initial_time=initial_time, residual_tolerance=residual_tolerance, + evolve_ppar=evolve_ppar, ion_dt=ion_dt) elseif solution_method == "shooting_method" dens = moments.electron.dens vthe = moments.electron.vth @@ -642,15 +643,16 @@ advance of the electron kinetic equation until a steady-state solution is reache Note that this function does not use the [`runge_kutta`](@ref) timestep functionality. `t_params.previous_dt[]` is used to store the (adaptively updated) initial timestep of the pseudotimestepping loop (initial value of `t_params.dt[]` within -`electron_backward_euler!()`). `t_params.dt[]` is adapted according to the iteration -counts of the Newton solver. +`electron_backward_euler_pseudotimestepping!()`). `t_params.dt[]` is adapted according to +the iteration counts of the Newton solver. """ -function electron_backward_euler!(scratch, pdf, moments, phi, collisions, composition, r, - z, vperp, vpa, z_spectral, vperp_spectral, vpa_spectral, z_advect, vpa_advect, - scratch_dummy, t_params, external_source_settings, num_diss_params, - nl_solver_params, max_electron_pdf_iterations, max_electron_sim_time; - io_electron=nothing, initial_time=nothing, residual_tolerance=nothing, - evolve_ppar=false, ion_dt=nothing) +function electron_backward_euler_pseudotimestepping!(scratch, pdf, moments, phi, + collisions, composition, r, z, vperp, vpa, z_spectral, vperp_spectral, + vpa_spectral, z_advect, vpa_advect, scratch_dummy, t_params, + external_source_settings, num_diss_params, nl_solver_params, + max_electron_pdf_iterations, max_electron_sim_time; io_electron=nothing, + initial_time=nothing, residual_tolerance=nothing, evolve_ppar=false, + ion_dt=nothing) if max_electron_pdf_iterations === nothing && max_electron_sim_time === nothing error("Must set one of max_electron_pdf_iterations and max_electron_sim_time") @@ -799,751 +801,35 @@ function electron_backward_euler!(scratch, pdf, moments, phi, collisions, compos end end - # Calculate heat flux and derivatives using updated f_electron - @views calculate_electron_qpar_from_pdf_no_r!(moments.electron.qpar[:,ir], - electron_ppar_new, - moments.electron.vth[:,ir], - f_electron_new, vpa, ir) - @views calculate_electron_moment_derivatives_no_r!( - moments, - (electron_density=moments.electron.dens[:,ir], - electron_upar=moments.electron.upar[:,ir], - electron_ppar=electron_ppar_new), - scratch_dummy, z, z_spectral, - num_diss_params.electron.moment_dissipation_coefficient, ir) - - if nl_solver_params.preconditioner_type === Val(:electron_split_lu) - if nl_solver_params.solves_since_precon_update[] ≥ nl_solver_params.preconditioner_update_interval - nl_solver_params.solves_since_precon_update[] = 0 - - vth = @view moments.electron.vth[:,ir] - me = composition.me_over_mi - dens = @view moments.electron.dens[:,ir] - upar = @view moments.electron.upar[:,ir] - ppar = electron_ppar_new - ddens_dz = @view moments.electron.ddens_dz[:,ir] - dupar_dz = @view moments.electron.dupar_dz[:,ir] - dppar_dz = @view moments.electron.dppar_dz[:,ir] - dvth_dz = @view moments.electron.dvth_dz[:,ir] - dqpar_dz = @view moments.electron.dqpar_dz[:,ir] - source_amplitude = moments.electron.external_source_amplitude - source_density_amplitude = moments.electron.external_source_density_amplitude - source_momentum_amplitude = moments.electron.external_source_momentum_amplitude - source_pressure_amplitude = moments.electron.external_source_pressure_amplitude - - # Note the region(s) used here must be the same as the region(s) used - # when the matrices are used in `split_precon!()`, so that the - # parallelisation is the same and each matrix is used on the same - # process that created it. - - # z-advection preconditioner - begin_vperp_vpa_region() - update_electron_speed_z!(z_advect[1], upar, vth, vpa.grid, ir) - @loop_vperp_vpa ivperp ivpa begin - z_matrix, ppar_matrix = get_electron_split_Jacobians!( - ivperp, ivpa, ppar, moments, collisions, composition, z, - vperp, vpa, z_spectral, vperp_spectral, vpa_spectral, - z_advect, vpa_advect, scratch_dummy, - external_source_settings, num_diss_params, t_params, ion_dt, - ir, evolve_ppar) - @timeit_debug global_timer "lu" nl_solver_params.preconditioners.z[ivpa,ivperp,ir] = lu(sparse(z_matrix)) - if ivperp == 1 && ivpa == 1 - @timeit_debug global_timer "lu" nl_solver_params.preconditioners.ppar[ir] = lu(sparse(ppar_matrix)) - end - end - end - - function split_precon!(x) - precon_ppar, precon_f = x - - begin_vperp_vpa_region() - @loop_vperp_vpa ivperp ivpa begin - z_precon_matrix = nl_solver_params.preconditioners.z[ivpa,ivperp,ir] - f_slice = @view precon_f[ivpa,ivperp,:] - @views z.scratch .= f_slice - @timeit_debug global_timer "ldiv!" ldiv!(z.scratch2, z_precon_matrix, z.scratch) - f_slice .= z.scratch2 - end - - begin_z_region() - ppar_precon_matrix = nl_solver_params.preconditioners.ppar[ir] - @loop_z iz begin - z.scratch[iz] = precon_ppar[iz] - end - - begin_serial_region() - @serial_region begin - @timeit_debug global_timer "ldiv!" ldiv!(precon_ppar, ppar_precon_matrix, z.scratch) - end - end - - left_preconditioner = identity - right_preconditioner = split_precon! - elseif nl_solver_params.preconditioner_type === Val(:electron_lu) - - if t_params.dt[] > 1.5 * nl_solver_params.precon_dt[] || - t_params.dt[] < 2.0/3.0 * nl_solver_params.precon_dt[] - - # dt has changed significantly, so update the preconditioner - nl_solver_params.solves_since_precon_update[] = nl_solver_params.preconditioner_update_interval - end - - if nl_solver_params.solves_since_precon_update[] ≥ nl_solver_params.preconditioner_update_interval -global_rank[] == 0 && println("recalculating precon") - nl_solver_params.solves_since_precon_update[] = 0 - nl_solver_params.precon_dt[] = t_params.dt[] - - orig_lu, precon_matrix, input_buffer, output_buffer = - nl_solver_params.preconditioners[ir] - - fill_electron_kinetic_equation_Jacobian!( - precon_matrix, f_electron_new, electron_ppar_new, moments, phi, - collisions, composition, z, vperp, vpa, z_spectral, - vperp_spectral, vpa_spectral, z_advect, vpa_advect, scratch_dummy, - external_source_settings, num_diss_params, t_params, ion_dt, - ir, evolve_ppar) - - begin_serial_region() - if block_rank[] == 0 - if size(orig_lu) == (1, 1) - # Have not properly created the LU decomposition before, so - # cannot reuse it. - @timeit_debug global_timer "lu" nl_solver_params.preconditioners[ir] = - (lu(sparse(precon_matrix)), precon_matrix, input_buffer, - output_buffer) - else - # LU decomposition was previously created. The Jacobian always - # has the same sparsity pattern, so by using `lu!()` we can - # reuse some setup. - try - @timeit_debug global_timer "lu!" lu!(orig_lu, sparse(precon_matrix); check=false) - catch e - if !isa(e, ArgumentError) - rethrow(e) - end - println("Sparsity pattern of matrix changed, rebuilding " - * " LU from scratch") - @timeit_debug global_timer "lu" orig_lu = lu(sparse(precon_matrix)) - end - nl_solver_params.preconditioners[ir] = - (orig_lu, precon_matrix, input_buffer, output_buffer) - end - else - nl_solver_params.preconditioners[ir] = - (orig_lu, precon_matrix, input_buffer, output_buffer) - end - end - - - @timeit_debug global_timer lu_precon!(x) = begin - precon_ppar, precon_f = x - - precon_lu, _, this_input_buffer, this_output_buffer = - nl_solver_params.preconditioners[ir] - - begin_serial_region() - counter = 1 - @loop_z_vperp_vpa iz ivperp ivpa begin - this_input_buffer[counter] = precon_f[ivpa,ivperp,iz] - counter += 1 - end - @loop_z iz begin - this_input_buffer[counter] = precon_ppar[iz] - counter += 1 - end - - begin_serial_region() - @serial_region begin - @timeit_debug global_timer "ldiv!" ldiv!(this_output_buffer, precon_lu, this_input_buffer) - end - - begin_serial_region() - counter = 1 - @loop_z_vperp_vpa iz ivperp ivpa begin - precon_f[ivpa,ivperp,iz] = this_output_buffer[counter] - counter += 1 - end - @loop_z iz begin - precon_ppar[iz] = this_output_buffer[counter] - counter += 1 - end - - # Ensure values of precon_f and precon_ppar are consistent across - # distributed-MPI block boundaries. For precon_f take the upwind - # value, and for precon_ppar take the average. - f_lower_endpoints = @view scratch_dummy.buffer_vpavperpr_1[:,:,ir] - f_upper_endpoints = @view scratch_dummy.buffer_vpavperpr_2[:,:,ir] - receive_buffer1 = @view scratch_dummy.buffer_vpavperpr_3[:,:,ir] - receive_buffer2 = @view scratch_dummy.buffer_vpavperpr_4[:,:,ir] - begin_vperp_vpa_region() - @loop_vperp_vpa ivperp ivpa begin - f_lower_endpoints[ivpa,ivperp] = precon_f[ivpa,ivperp,1] - f_upper_endpoints[ivpa,ivperp] = precon_f[ivpa,ivperp,end] - end - # We upwind the z-derivatives in `electron_z_advection!()`, so would - # expect that upwinding the results here in z would make sense. - # However, upwinding here makes convergence much slower (~10x), - # compared to picking the values from one side or other of the block - # boundary, or taking the average of the values on either side. - # Neither direction is special, so taking the average seems most - # sensible (although in an intial test it does not seem to converge - # faster than just picking one or the other). - # Maybe this could indicate that it is more important to have a fully - # self-consistent Jacobian inversion for the - # `electron_vpa_advection()` part rather than taking half(ish) of the - # values from one block and the other half(ish) from the other. - reconcile_element_boundaries_MPI_z_pdf_vpavperpz!( - precon_f, f_lower_endpoints, f_upper_endpoints, receive_buffer1, - receive_buffer2, z) - - begin_serial_region() - @serial_region begin - buffer_1[] = precon_ppar[1] - buffer_2[] = precon_ppar[end] - end - reconcile_element_boundaries_MPI!( - precon_ppar, buffer_1, buffer_2, buffer_3, buffer_4, z) - - return nothing - end - - left_preconditioner = identity - right_preconditioner = lu_precon! - elseif nl_solver_params.preconditioner_type === Val(:electron_adi) - - if t_params.dt[] > 1.5 * nl_solver_params.precon_dt[] || - t_params.dt[] < 2.0/3.0 * nl_solver_params.precon_dt[] - - # dt has changed significantly, so update the preconditioner - nl_solver_params.solves_since_precon_update[] = nl_solver_params.preconditioner_update_interval - end - - if nl_solver_params.solves_since_precon_update[] ≥ nl_solver_params.preconditioner_update_interval -global_rank[] == 0 && println("recalculating precon") - nl_solver_params.solves_since_precon_update[] = 0 - nl_solver_params.precon_dt[] = t_params.dt[] - - adi_info = nl_solver_params.preconditioners[ir] - - dens = @view moments.electron.dens[:,ir] - upar = @view moments.electron.upar[:,ir] - vth = @view moments.electron.vth[:,ir] - qpar = @view moments.electron.qpar[:,ir] - - # Reconstruct w_∥^3 moment of g_e from already-calculated qpar - third_moment = scratch_dummy.buffer_z_1 - dthird_moment_dz = scratch_dummy.buffer_z_2 - begin_z_region() - @loop_z iz begin - third_moment[iz] = 0.5 * qpar[iz] / electron_ppar_new[iz] / vth[iz] - end - derivative_z!(dthird_moment_dz, third_moment, buffer_1, buffer_2, - buffer_3, buffer_4, z_spectral, z) - - z_speed = @view z_advect[1].speed[:,:,:,ir] - - dpdf_dz = @view scratch_dummy.buffer_vpavperpzr_1[:,:,:,ir] - begin_vperp_vpa_region() - update_electron_speed_z!(z_advect[1], upar, vth, vpa.grid, ir) - @loop_vperp_vpa ivperp ivpa begin - @views z_advect[1].adv_fac[:,ivpa,ivperp,ir] = -z_speed[:,ivpa,ivperp] - end - #calculate the upwind derivative - @views derivative_z_pdf_vpavperpz!(dpdf_dz, f_electron_new, - z_advect[1].adv_fac[:,:,:,ir], - scratch_dummy.buffer_vpavperpr_1[:,:,ir], - scratch_dummy.buffer_vpavperpr_2[:,:,ir], - scratch_dummy.buffer_vpavperpr_3[:,:,ir], - scratch_dummy.buffer_vpavperpr_4[:,:,ir], - scratch_dummy.buffer_vpavperpr_5[:,:,ir], - scratch_dummy.buffer_vpavperpr_6[:,:,ir], - z_spectral, z) - - dpdf_dvpa = @view scratch_dummy.buffer_vpavperpzr_2[:,:,:,ir] - begin_z_vperp_region() - update_electron_speed_vpa!(vpa_advect[1], dens, upar, - electron_ppar_new, moments, vpa.grid, - external_source_settings.electron, ir) - @loop_z_vperp iz ivperp begin - @views @. vpa_advect[1].adv_fac[:,ivperp,iz,ir] = -vpa_advect[1].speed[:,ivperp,iz,ir] - end - #calculate the upwind derivative of the electron pdf w.r.t. wpa - @loop_z_vperp iz ivperp begin - @views derivative!(dpdf_dvpa[:,ivperp,iz], f_electron_new[:,ivperp,iz], vpa, - vpa_advect[1].adv_fac[:,ivperp,iz,ir], vpa_spectral) - end - - zeroth_moment = z.scratch_shared - first_moment = z.scratch_shared2 - second_moment = z.scratch_shared3 - begin_z_region() - vpa_grid = vpa.grid - vpa_wgts = vpa.wgts - @loop_z iz begin - @views zeroth_moment[iz] = integrate_over_vspace(f_electron_new[:,1,iz], vpa_wgts) - @views first_moment[iz] = integrate_over_vspace(f_electron_new[:,1,iz], vpa_grid, vpa_wgts) - @views second_moment[iz] = integrate_over_vspace(f_electron_new[:,1,iz], vpa_grid, 2, vpa_wgts) - end - - v_size = vperp.n * vpa.n - - # Do setup for 'v solves' - v_solve_counter = 0 - A = adi_info.v_solve_matrix_buffer - explicit_J = adi_info.J_buffer - # Get sparse matrix for explicit, right-hand-side part of the - # solve. - if adi_info.n_extra_iterations > 0 - # If we only do one 'iteration' we don't need the 'explicit - # matrix' for the first solve (the v-solve), because the initial - # guess is zero, - fill_electron_kinetic_equation_Jacobian!( - explicit_J, f_electron_new, electron_ppar_new, moments, - phi, collisions, composition, z, vperp, vpa, z_spectral, - vperp_spectral, vpa_spectral, z_advect, vpa_advect, - scratch_dummy, external_source_settings, num_diss_params, - t_params, ion_dt, ir, evolve_ppar, :explicit_z, false) - end - begin_z_region() - @loop_z iz begin - v_solve_counter += 1 - # Get LU-factorized matrix for implicit part of the solve - @views fill_electron_kinetic_equation_v_only_Jacobian!( - A, f_electron_new[:,:,iz], electron_ppar_new[iz], - dpdf_dz[:,:,iz], dpdf_dvpa[:,:,iz], z_speed, moments, - zeroth_moment[iz], first_moment[iz], second_moment[iz], - third_moment[iz], dthird_moment_dz[iz], phi[iz], collisions, - composition, z, vperp, vpa, z_spectral, vperp_spectral, - vpa_spectral, z_advect, vpa_advect, scratch_dummy, - external_source_settings, num_diss_params, t_params, ion_dt, - ir, iz, evolve_ppar) - A_sparse = sparse(A) - if !isassigned(adi_info.v_solve_implicit_lus, v_solve_counter) - @timeit_debug global_timer "lu" adi_info.v_solve_implicit_lus[v_solve_counter] = lu(A_sparse) - else - # LU decomposition was previously created. The Jacobian always - # has the same sparsity pattern, so by using `lu!()` we can - # reuse some setup. - try - @timeit_debug global_timer "lu!" lu!(adi_info.v_solve_implicit_lus[v_solve_counter], A_sparse; check=false) - catch e - if !isa(e, ArgumentError) - rethrow(e) - end - println("Sparsity pattern of matrix changed, rebuilding " - * " LU from scratch ir=$ir, iz=$iz") - @timeit_debug global_timer "lu" adi_info.v_solve_implicit_lus[v_solve_counter] = lu(A_sparse) - end - end - - if adi_info.n_extra_iterations > 0 - # If we only do one 'iteration' we don't need the 'explicit - # matrix' for the first solve (the v-solve), because the - # initial guess is zero, - adi_info.v_solve_explicit_matrices[v_solve_counter] = sparse(@view(explicit_J[adi_info.v_solve_global_inds[v_solve_counter],:])) - end - end - @boundscheck v_solve_counter == adi_info.v_solve_nsolve || error("v_solve_counter($v_solve_counter) != v_solve_nsolve($(adi_info.v_solve_nsolve))") - - # Do setup for 'z solves' - z_solve_counter = 0 - A = adi_info.z_solve_matrix_buffer - explicit_J = adi_info.J_buffer - # Get sparse matrix for explicit, right-hand-side part of the - # solve. - fill_electron_kinetic_equation_Jacobian!( - explicit_J, f_electron_new, electron_ppar_new, moments, phi, - collisions, composition, z, vperp, vpa, z_spectral, - vperp_spectral, vpa_spectral, z_advect, vpa_advect, scratch_dummy, - external_source_settings, num_diss_params, t_params, ion_dt, ir, - evolve_ppar, :explicit_v, false) - begin_vperp_vpa_region() - @loop_vperp_vpa ivperp ivpa begin - z_solve_counter += 1 - - # Get LU-factorized matrix for implicit part of the solve - @views fill_electron_kinetic_equation_z_only_Jacobian_f!( - A, f_electron_new[ivpa,ivperp,:], electron_ppar_new, - dpdf_dz[ivpa,ivperp,:], dpdf_dvpa[ivpa,ivperp,:], z_speed, - moments, zeroth_moment, first_moment, second_moment, - third_moment, dthird_moment_dz, collisions, composition, z, - vperp, vpa, z_spectral, vperp_spectral, vpa_spectral, - z_advect, vpa_advect, scratch_dummy, external_source_settings, - num_diss_params, t_params, ion_dt, ir, ivperp, ivpa, - evolve_ppar) - - A_sparse = sparse(A) - if !isassigned(adi_info.z_solve_implicit_lus, z_solve_counter) - @timeit_debug global_timer "lu" adi_info.z_solve_implicit_lus[z_solve_counter] = lu(A_sparse) - else - # LU decomposition was previously created. The Jacobian always - # has the same sparsity pattern, so by using `lu!()` we can - # reuse some setup. - try - @timeit_debug global_timer "lu!" lu!(adi_info.z_solve_implicit_lus[z_solve_counter], A_sparse; check=false) - catch e - if !isa(e, ArgumentError) - rethrow(e) - end - println("Sparsity pattern of matrix changed, rebuilding " - * " LU from scratch ir=$ir, ivperp=$ivperp, ivpa=$ivpa") - @timeit_debug global_timer "lu" adi_info.z_solve_implicit_lus[z_solve_counter] = lu(A_sparse) - end - end - - adi_info.z_solve_explicit_matrices[z_solve_counter] = sparse(@view(explicit_J[adi_info.z_solve_global_inds[z_solve_counter],:])) - end - begin_serial_region(; no_synchronize=true) - @serial_region begin - # Do the solve for ppar on the rank-0 process, which has the - # fewest grid points to handle if there are not an exactly equal - # number of points for each process. - z_solve_counter += 1 - - # Get LU-factorized matrix for implicit part of the solve - @views fill_electron_kinetic_equation_z_only_Jacobian_ppar!( - A, electron_ppar_new, moments, zeroth_moment, first_moment, - second_moment, third_moment, dthird_moment_dz, collisions, - composition, z, vperp, vpa, z_spectral, vperp_spectral, - vpa_spectral, z_advect, vpa_advect, scratch_dummy, - external_source_settings, num_diss_params, t_params, ion_dt, - ir, evolve_ppar) - - A_sparse = sparse(A) - if !isassigned(adi_info.z_solve_implicit_lus, z_solve_counter) - @timeit_debug global_timer "lu" adi_info.z_solve_implicit_lus[z_solve_counter] = lu(A_sparse) - else - # LU decomposition was previously created. The Jacobian always - # has the same sparsity pattern, so by using `lu!()` we can - # reuse some setup. - try - @timeit_debug global_timer "lu!" lu!(adi_info.z_solve_implicit_lus[z_solve_counter], A_sparse; check=false) - catch e - if !isa(e, ArgumentError) - rethrow(e) - end - println("Sparsity pattern of matrix changed, rebuilding " - * " LU from scratch ir=$ir, ppar z-solve") - @timeit_debug global_timer "lu" adi_info.z_solve_implicit_lus[z_solve_counter] = lu(A_sparse) - end - end - - adi_info.z_solve_explicit_matrices[z_solve_counter] = sparse(@view(explicit_J[adi_info.z_solve_global_inds[z_solve_counter],:])) - end - @boundscheck z_solve_counter == adi_info.z_solve_nsolve || error("z_solve_counter($z_solve_counter) != z_solve_nsolve($(adi_info.z_solve_nsolve))") - end - - @timeit_debug global_timer adi_precon!(x) = begin - precon_ppar, precon_f = x - - adi_info = nl_solver_params.preconditioners[ir] - precon_iterations = nl_solver_params.precon_iterations - this_input_buffer = adi_info.input_buffer - this_intermediate_buffer = adi_info.intermediate_buffer - this_output_buffer = adi_info.output_buffer - global_index_subrange = adi_info.global_index_subrange - n_extra_iterations = adi_info.n_extra_iterations - - v_size = vperp.n * vpa.n - pdf_size = z.n * v_size - - # Use these views to communicate block-boundary points - output_buffer_pdf_view = reshape(@view(this_output_buffer[1:pdf_size]), size(precon_f)) - output_buffer_ppar_view = @view(this_output_buffer[pdf_size+1:end]) - f_lower_endpoints = @view scratch_dummy.buffer_vpavperpr_1[:,:,ir] - f_upper_endpoints = @view scratch_dummy.buffer_vpavperpr_2[:,:,ir] - receive_buffer1 = @view scratch_dummy.buffer_vpavperpr_3[:,:,ir] - receive_buffer2 = @view scratch_dummy.buffer_vpavperpr_4[:,:,ir] - - function adi_communicate_boundary_points() - # Ensure values of precon_f and precon_ppar are consistent across - # distributed-MPI block boundaries. For precon_f take the upwind - # value, and for precon_ppar take the average. - begin_vperp_vpa_region() - @loop_vperp_vpa ivperp ivpa begin - f_lower_endpoints[ivpa,ivperp] = output_buffer_pdf_view[ivpa,ivperp,1] - f_upper_endpoints[ivpa,ivperp] = output_buffer_pdf_view[ivpa,ivperp,end] - end - # We upwind the z-derivatives in `electron_z_advection!()`, so would - # expect that upwinding the results here in z would make sense. - # However, upwinding here makes convergence much slower (~10x), - # compared to picking the values from one side or other of the block - # boundary, or taking the average of the values on either side. - # Neither direction is special, so taking the average seems most - # sensible (although in an intial test it does not seem to converge - # faster than just picking one or the other). - # Maybe this could indicate that it is more important to have a fully - # self-consistent Jacobian inversion for the - # `electron_vpa_advection()` part rather than taking half(ish) of the - # values from one block and the other half(ish) from the other. - reconcile_element_boundaries_MPI_z_pdf_vpavperpz!( - output_buffer_pdf_view, f_lower_endpoints, f_upper_endpoints, receive_buffer1, - receive_buffer2, z) - - begin_serial_region() - @serial_region begin - buffer_1[] = output_buffer_ppar_view[1] - buffer_2[] = output_buffer_ppar_view[end] - end - reconcile_element_boundaries_MPI!( - output_buffer_ppar_view, buffer_1, buffer_2, buffer_3, buffer_4, z) - - return nothing - end - - begin_z_vperp_vpa_region() - @loop_z_vperp_vpa iz ivperp ivpa begin - row = (iz - 1)*v_size + (ivperp - 1)*vpa.n + ivpa - this_input_buffer[row] = precon_f[ivpa,ivperp,iz] - end - begin_z_region() - @loop_z iz begin - row = pdf_size + iz - this_input_buffer[row] = precon_ppar[iz] - end - _block_synchronize() - - # Use this to copy current guess from output_buffer to - # intermediate_buffer, to avoid race conditions as new guess is - # written into output_buffer. - function fill_intermediate_buffer!() - _block_synchronize() - for i ∈ global_index_subrange - this_intermediate_buffer[i] = this_output_buffer[i] - end - _block_synchronize() - end - - v_solve_global_inds = adi_info.v_solve_global_inds - v_solve_nsolve = adi_info.v_solve_nsolve - v_solve_implicit_lus = adi_info.v_solve_implicit_lus - v_solve_explicit_matrices = adi_info.v_solve_explicit_matrices - v_solve_buffer = adi_info.v_solve_buffer - v_solve_buffer2 = adi_info.v_solve_buffer2 - function first_adi_v_solve!() - # The initial guess is all-zero, so for the first solve there is - # no need to multiply by the 'explicit matrix' as x==0, so E.x==0 - for isolve ∈ 1:v_solve_nsolve - this_inds = v_solve_global_inds[isolve] - v_solve_buffer .= this_input_buffer[this_inds] - @timeit_debug global_timer "ldiv!" ldiv!(v_solve_buffer2, v_solve_implicit_lus[isolve], v_solve_buffer) - this_output_buffer[this_inds] .= v_solve_buffer2 - end - end - function adi_v_solve!() - for isolve ∈ 1:v_solve_nsolve - this_inds = v_solve_global_inds[isolve] - v_solve_buffer .= @view this_input_buffer[this_inds] - # Need to multiply the 'explicit matrix' by -1, because all - # the Jacobian-calculation functions are defined as if the - # terms are being added to the left-hand-side preconditioner - # matrix, but here the 'explicit matrix' terms are added on - # the right-hand-side. - @timeit_debug global_timer "mul!" mul!(v_solve_buffer, v_solve_explicit_matrices[isolve], - this_intermediate_buffer, -1.0, 1.0) - @timeit_debug global_timer "ldiv!" ldiv!(v_solve_buffer2, v_solve_implicit_lus[isolve], v_solve_buffer) - this_output_buffer[this_inds] .= v_solve_buffer2 - end - end - - z_solve_global_inds = adi_info.z_solve_global_inds - z_solve_nsolve = adi_info.z_solve_nsolve - z_solve_implicit_lus = adi_info.z_solve_implicit_lus - z_solve_explicit_matrices = adi_info.z_solve_explicit_matrices - z_solve_buffer = adi_info.z_solve_buffer - z_solve_buffer2 = adi_info.z_solve_buffer2 - function adi_z_solve!() - for isolve ∈ 1:z_solve_nsolve - this_inds = z_solve_global_inds[isolve] - z_solve_buffer .= @view this_input_buffer[this_inds] - # Need to multiply the 'explicit matrix' by -1, because all - # the Jacobian-calculation functions are defined as if the - # terms are being added to the left-hand-side preconditioner - # matrix, but here the 'explicit matrix' terms are added on - # the right-hand-side. - @timeit_debug global_timer "mul!" mul!(z_solve_buffer, z_solve_explicit_matrices[isolve], this_intermediate_buffer, -1.0, 1.0) - @timeit_debug global_timer "ldiv!" ldiv!(z_solve_buffer2, z_solve_implicit_lus[isolve], z_solve_buffer) - this_output_buffer[this_inds] .= z_solve_buffer2 - end - end - - precon_iterations[] += 1 - first_adi_v_solve!() - fill_intermediate_buffer!() - adi_z_solve!() - adi_communicate_boundary_points() - - for n ∈ 1:n_extra_iterations - precon_iterations[] += 1 - fill_intermediate_buffer!() - adi_v_solve!() - fill_intermediate_buffer!() - adi_z_solve!() - adi_communicate_boundary_points() - end - - # Unpack preconditioner solution - begin_z_vperp_vpa_region() - @loop_z_vperp_vpa iz ivperp ivpa begin - row = (iz - 1)*v_size + (ivperp - 1)*vpa.n + ivpa - precon_f[ivpa,ivperp,iz] = this_output_buffer[row] - end - begin_z_region() - @loop_z iz begin - row = pdf_size + iz - precon_ppar[iz] = this_output_buffer[row] - end - - return nothing - end - - left_preconditioner = identity - right_preconditioner = adi_precon! - elseif nl_solver_params.preconditioner_type === Val(:none) - left_preconditioner = identity - right_preconditioner = identity - else - error("preconditioner_type=$(nl_solver_params.preconditioner_type) is not " - * "supported by electron_backward_euler!().") - end - - # Do a backward-Euler update of the electron pdf, and (if evove_ppar=true) the - # electron parallel pressure. - function residual_func!(this_residual, new_variables; krylov=false) - electron_ppar_residual, f_electron_residual = this_residual - electron_ppar_newvar, f_electron_newvar = new_variables - - if evolve_ppar - this_dens = moments.electron.dens - this_upar = moments.electron.upar - this_vth = moments.electron.vth - begin_z_region() - @loop_z iz begin - # update the electron thermal speed using the updated electron - # parallel pressure - this_vth[iz,ir] = sqrt(abs(2.0 * electron_ppar_newvar[iz] / - (this_dens[iz,ir] * - composition.me_over_mi))) - end - end - - # enforce the boundary condition(s) on the electron pdf - @views enforce_boundary_condition_on_electron_pdf!( - f_electron_newvar, phi, moments.electron.vth[:,ir], - moments.electron.upar[:,ir], z, vperp, vpa, vperp_spectral, - vpa_spectral, vpa_advect, moments, - num_diss_params.electron.vpa_dissipation_coefficient > 0.0, - composition.me_over_mi, ir; bc_constraints=false, - update_vcut=!krylov) - - if evolve_ppar - # Calculate heat flux and derivatives using new_variables + step_success = electron_backward_euler!( + old_scratch, new_scratch, moments, phi, collisions, + composition, r, z, vperp, vpa, z_spectral, vperp_spectral, + vpa_spectral, z_advect, vpa_advect, scratch_dummy, + t_params, external_source_settings, num_diss_params, + nl_solver_params, ir; evolve_ppar=evolve_ppar, + ion_dt=ion_dt) + + if step_success + apply_electron_bc_and_constraints_no_r!(f_electron_new, phi, moments, r, + z, vperp, vpa, vperp_spectral, + vpa_spectral, vpa_advect, + num_diss_params, composition, ir, + nl_solver_params) + + if !evolve_ppar + # update the electron heat flux + moments.electron.qpar_updated[] = false @views calculate_electron_qpar_from_pdf_no_r!(moments.electron.qpar[:,ir], - electron_ppar_newvar, + electron_ppar_new, moments.electron.vth[:,ir], - f_electron_newvar, vpa, - ir) + f_electron_new, vpa, ir) - calculate_electron_moment_derivatives_no_r!( - moments, - (electron_density=this_dens, - electron_upar=this_upar, - electron_ppar=electron_ppar_newvar), - scratch_dummy, z, z_spectral, - num_diss_params.electron.moment_dissipation_coefficient, ir) - else - # Calculate heat flux and derivatives using new_variables - @views calculate_electron_qpar_from_pdf_no_r!(moments.electron.qpar[:,ir], - electron_ppar_newvar, - moments.electron.vth[:,ir], - f_electron_newvar, vpa, - ir) # compute the z-derivative of the parallel electron heat flux @views derivative_z!(moments.electron.dqpar_dz[:,ir], moments.electron.qpar[:,ir], buffer_1, buffer_2, buffer_3, buffer_4, z_spectral, z) end - if evolve_ppar - begin_z_region() - @loop_z iz begin - electron_ppar_residual[iz] = electron_ppar_old[iz,ir] - end - else - begin_z_region() - @loop_z iz begin - electron_ppar_residual[iz] = 0.0 - end - end - - # electron_kinetic_equation_euler_update!() just adds dt*d(g_e)/dt to the - # electron_pdf member of the first argument, so if we set the electron_pdf member - # of the first argument to zero, and pass dt=1, then it will evaluate the time - # derivative, which is the residual for a steady-state solution. - begin_z_vperp_vpa_region() - @loop_z_vperp_vpa iz ivperp ivpa begin - f_electron_residual[ivpa,ivperp,iz] = f_electron_old[ivpa,ivperp,iz] - end - electron_kinetic_equation_euler_update!( - f_electron_residual, electron_ppar_residual, f_electron_newvar, - electron_ppar_newvar, moments, z, vperp, vpa, z_spectral, - vpa_spectral, z_advect, vpa_advect, scratch_dummy, collisions, - composition, external_source_settings, num_diss_params, t_params, - ir; evolve_ppar=evolve_ppar, ion_dt=ion_dt, - soft_force_constraints=true) - - # Now - # residual = f_electron_old + dt*RHS(f_electron_newvar) - # so update to desired residual - begin_z_vperp_vpa_region() - @loop_z_vperp_vpa iz ivperp ivpa begin - f_electron_residual[ivpa,ivperp,iz] = f_electron_newvar[ivpa,ivperp,iz] - f_electron_residual[ivpa,ivperp,iz] - end - if evolve_ppar - begin_z_region() - @loop_z iz begin - electron_ppar_residual[iz] = electron_ppar_newvar[iz] - electron_ppar_residual[iz] - end - end - - # Set residual to zero where pdf_electron is determined by boundary conditions. - if vpa.n > 1 - begin_z_vperp_region() - @loop_z_vperp iz ivperp begin - @views enforce_v_boundary_condition_local!(f_electron_residual[:,ivperp,iz], vpa.bc, - vpa_advect[1].speed[:,ivperp,iz,ir], - num_diss_params.electron.vpa_dissipation_coefficient > 0.0, - vpa, vpa_spectral) - end - end - if vperp.n > 1 - begin_z_vpa_region() - enforce_vperp_boundary_condition!(f_electron_residual, vperp.bc, - vperp, vperp_spectral, vperp_adv, - vperp_diffusion, ir) - end - zero_z_boundary_condition_points(f_electron_residual, z, vpa, moments, ir) - - return nothing - end - - residual = (scratch_dummy.implicit_buffer_z_1, scratch_dummy.implicit_buffer_vpavperpz_1) - delta_x = (scratch_dummy.implicit_buffer_z_2, - scratch_dummy.implicit_buffer_vpavperpz_2) - rhs_delta = (scratch_dummy.implicit_buffer_z_3, - scratch_dummy.implicit_buffer_vpavperpz_3) - v = (scratch_dummy.implicit_buffer_z_4, - scratch_dummy.implicit_buffer_vpavperpz_4) - w = (scratch_dummy.implicit_buffer_z_5, - scratch_dummy.implicit_buffer_vpavperpz_5) - - newton_success = newton_solve!((electron_ppar_new, f_electron_new), - residual_func!, residual, delta_x, rhs_delta, - v, w, nl_solver_params; - left_preconditioner=left_preconditioner, - right_preconditioner=right_preconditioner, - coords=(z=z, vperp=vperp, vpa=vpa)) - if newton_success #println("Newton its ", nl_solver_params.max_nonlinear_iterations_this_step[], " ", t_params.dt[]) # update the time following the pdf update t_params.t[] += t_params.dt[] @@ -1620,75 +906,32 @@ global_rank[] == 0 && println("recalculating precon") @loop_z iz begin electron_ppar_new[iz] = electron_ppar_old[iz] end - end - new_lowerz_vcut_inds = r.scratch_shared_int - new_upperz_vcut_inds = r.scratch_shared_int2 - apply_electron_bc_and_constraints_no_r!(f_electron_new, phi, moments, z, - vperp, vpa, vperp_spectral, - vpa_spectral, vpa_advect, - num_diss_params, composition, ir; - lowerz_vcut_inds=new_lowerz_vcut_inds, - upperz_vcut_inds=new_upperz_vcut_inds) - # Check if either vcut_ind has changed - if either has, recalculate the - # preconditioner because the response at the grid point before the cutoff is - # sharp, so the preconditioner could be significantly wrong when it was - # calculated using the wrong vcut_ind. - lower_vcut_changed = @view z.scratch_shared_int[1:1] - upper_vcut_changed = @view z.scratch_shared_int[2:2] - @serial_region begin - if z.irank == 0 - precon_lowerz_vcut_inds = nl_solver_params.precon_lowerz_vcut_inds - if all(new_lowerz_vcut_inds .== precon_lowerz_vcut_inds) - lower_vcut_changed[] = 0 - else - lower_vcut_changed[] = 1 - precon_lowerz_vcut_inds .= new_lowerz_vcut_inds - end - end - MPI.Bcast!(lower_vcut_changed, comm_inter_block[]; root=0) - #req1 = MPI.Ibcast!(lower_vcut_changed, comm_inter_block[]; root=0) + new_lowerz_vcut_ind = @view r.scratch_shared_int[ir:ir] + new_upperz_vcut_ind = @view r.scratch_shared_int2[ir:ir] + apply_electron_bc_and_constraints_no_r!(f_electron_new, phi, moments, r, + z, vperp, vpa, vperp_spectral, + vpa_spectral, vpa_advect, + num_diss_params, composition, ir, + nl_solver_params) + + if !evolve_ppar + # update the electron heat flux + moments.electron.qpar_updated[] = false + @views calculate_electron_qpar_from_pdf_no_r!(moments.electron.qpar[:,ir], + electron_ppar_new, + moments.electron.vth[:,ir], + f_electron_new, vpa, ir) - if z.irank == z.nrank - 1 - precon_upperz_vcut_inds = nl_solver_params.precon_upperz_vcut_inds - if all(new_upperz_vcut_inds .== precon_upperz_vcut_inds) - upper_vcut_changed[] = 0 - else - upper_vcut_changed[] = 1 - precon_upperz_vcut_inds .= new_upperz_vcut_inds - end + # compute the z-derivative of the parallel electron heat flux + @views derivative_z!(moments.electron.dqpar_dz[:,ir], + moments.electron.qpar[:,ir], buffer_1, buffer_2, + buffer_3, buffer_4, z_spectral, z) end - MPI.Bcast!(upper_vcut_changed, comm_inter_block[]; root=n_blocks[]-1) - #req2 = MPI.Ibcast!(upper_vcut_changed, comm_inter_block[]; root=n_blocks[]-1) - - # Eventually can use Ibcast!() to make the two broadcasts run - # simultaneously, but need the function to be merged into MPI.jl (see - # https://github.com/JuliaParallel/MPI.jl/pull/882). - #MPI.Waitall([req1, req2]) - end - _block_synchronize() - if lower_vcut_changed[] == 1 || upper_vcut_changed[] == 1 - # One or both of the indices changed for some `ir`, so force the - # preconditioner to be recalculated next time. - nl_solver_params.solves_since_precon_update[] = nl_solver_params.preconditioner_update_interval - end - - if !evolve_ppar - # update the electron heat flux - moments.electron.qpar_updated[] = false - @views calculate_electron_qpar_from_pdf_no_r!(moments.electron.qpar[:,ir], - electron_ppar_new, - moments.electron.vth[:,ir], - f_electron_new, vpa, ir) - - # compute the z-derivative of the parallel electron heat flux - @views derivative_z!(moments.electron.dqpar_dz[:,ir], - moments.electron.qpar[:,ir], buffer_1, buffer_2, - buffer_3, buffer_4, z_spectral, z) end residual_norm = -1.0 - if newton_success + if step_success # Calculate residuals to decide if iteration is converged. # Might want an option to calculate the r_normesidual only after a certain # number of iterations (especially during initialization when there are @@ -1830,6 +1073,781 @@ global_rank[] == 0 && println("recalculating precon") return success end +""" + electron_backward_euler!(old_scratch, new_scratch, moments, phi, + collisions, composition, r, z, vperp, vpa, z_spectral, vperp_spectral, + vpa_spectral, z_advect, vpa_advect, scratch_dummy, t_params, + external_source_settings, num_diss_params, nl_solver_params, ir; + evolve_ppar=false, ion_dt=nothing) = begin + +Take a single backward euler timestep for the electron shape function \$g_e\$ and parallel +pressure \$p_{e∥}\$. +""" +@timeit global_timer electron_backward_euler!(old_scratch, new_scratch, moments, phi, + collisions, composition, r, z, vperp, vpa, z_spectral, vperp_spectral, + vpa_spectral, z_advect, vpa_advect, scratch_dummy, t_params, + external_source_settings, num_diss_params, nl_solver_params, ir; + evolve_ppar=false, ion_dt=nothing) = begin + + # create several 0D dummy arrays for use in taking derivatives + buffer_1 = @view scratch_dummy.buffer_rs_1[ir,1] + buffer_2 = @view scratch_dummy.buffer_rs_2[ir,1] + buffer_3 = @view scratch_dummy.buffer_rs_3[ir,1] + buffer_4 = @view scratch_dummy.buffer_rs_4[ir,1] + + f_electron_old = @view old_scratch.pdf_electron[:,:,:,ir] + f_electron_new = @view new_scratch.pdf_electron[:,:,:,ir] + electron_ppar_old = @view old_scratch.electron_ppar[:,ir] + electron_ppar_new = @view new_scratch.electron_ppar[:,ir] + + # Calculate heat flux and derivatives using updated f_electron + @views calculate_electron_qpar_from_pdf_no_r!(moments.electron.qpar[:,ir], + electron_ppar_new, + moments.electron.vth[:,ir], + f_electron_new, vpa, ir) + @views calculate_electron_moment_derivatives_no_r!( + moments, + (electron_density=moments.electron.dens[:,ir], + electron_upar=moments.electron.upar[:,ir], + electron_ppar=electron_ppar_new), + scratch_dummy, z, z_spectral, + num_diss_params.electron.moment_dissipation_coefficient, ir) + + if nl_solver_params.preconditioner_type === Val(:electron_split_lu) + if nl_solver_params.solves_since_precon_update[] ≥ nl_solver_params.preconditioner_update_interval + nl_solver_params.solves_since_precon_update[] = 0 + + vth = @view moments.electron.vth[:,ir] + me = composition.me_over_mi + dens = @view moments.electron.dens[:,ir] + upar = @view moments.electron.upar[:,ir] + ppar = electron_ppar_new + ddens_dz = @view moments.electron.ddens_dz[:,ir] + dupar_dz = @view moments.electron.dupar_dz[:,ir] + dppar_dz = @view moments.electron.dppar_dz[:,ir] + dvth_dz = @view moments.electron.dvth_dz[:,ir] + dqpar_dz = @view moments.electron.dqpar_dz[:,ir] + source_amplitude = moments.electron.external_source_amplitude + source_density_amplitude = moments.electron.external_source_density_amplitude + source_momentum_amplitude = moments.electron.external_source_momentum_amplitude + source_pressure_amplitude = moments.electron.external_source_pressure_amplitude + + # Note the region(s) used here must be the same as the region(s) used + # when the matrices are used in `split_precon!()`, so that the + # parallelisation is the same and each matrix is used on the same + # process that created it. + + # z-advection preconditioner + begin_vperp_vpa_region() + update_electron_speed_z!(z_advect[1], upar, vth, vpa.grid, ir) + @loop_vperp_vpa ivperp ivpa begin + z_matrix, ppar_matrix = get_electron_split_Jacobians!( + ivperp, ivpa, ppar, moments, collisions, composition, z, + vperp, vpa, z_spectral, vperp_spectral, vpa_spectral, + z_advect, vpa_advect, scratch_dummy, + external_source_settings, num_diss_params, t_params, ion_dt, + ir, evolve_ppar) + @timeit_debug global_timer "lu" nl_solver_params.preconditioners.z[ivpa,ivperp,ir] = lu(sparse(z_matrix)) + if ivperp == 1 && ivpa == 1 + @timeit_debug global_timer "lu" nl_solver_params.preconditioners.ppar[ir] = lu(sparse(ppar_matrix)) + end + end + end + + function split_precon!(x) + precon_ppar, precon_f = x + + begin_vperp_vpa_region() + @loop_vperp_vpa ivperp ivpa begin + z_precon_matrix = nl_solver_params.preconditioners.z[ivpa,ivperp,ir] + f_slice = @view precon_f[ivpa,ivperp,:] + @views z.scratch .= f_slice + @timeit_debug global_timer "ldiv!" ldiv!(z.scratch2, z_precon_matrix, z.scratch) + f_slice .= z.scratch2 + end + + begin_z_region() + ppar_precon_matrix = nl_solver_params.preconditioners.ppar[ir] + @loop_z iz begin + z.scratch[iz] = precon_ppar[iz] + end + + begin_serial_region() + @serial_region begin + @timeit_debug global_timer "ldiv!" ldiv!(precon_ppar, ppar_precon_matrix, z.scratch) + end + end + + left_preconditioner = identity + right_preconditioner = split_precon! + elseif nl_solver_params.preconditioner_type === Val(:electron_lu) + + if t_params.dt[] > 1.5 * nl_solver_params.precon_dt[] || + t_params.dt[] < 2.0/3.0 * nl_solver_params.precon_dt[] + + # dt has changed significantly, so update the preconditioner + nl_solver_params.solves_since_precon_update[] = nl_solver_params.preconditioner_update_interval + end + + if nl_solver_params.solves_since_precon_update[] ≥ nl_solver_params.preconditioner_update_interval +global_rank[] == 0 && println("recalculating precon") + nl_solver_params.solves_since_precon_update[] = 0 + nl_solver_params.precon_dt[] = t_params.dt[] + + orig_lu, precon_matrix, input_buffer, output_buffer = + nl_solver_params.preconditioners[ir] + + fill_electron_kinetic_equation_Jacobian!( + precon_matrix, f_electron_new, electron_ppar_new, moments, phi, + collisions, composition, z, vperp, vpa, z_spectral, + vperp_spectral, vpa_spectral, z_advect, vpa_advect, scratch_dummy, + external_source_settings, num_diss_params, t_params, ion_dt, + ir, evolve_ppar) + + begin_serial_region() + if block_rank[] == 0 + if size(orig_lu) == (1, 1) + # Have not properly created the LU decomposition before, so + # cannot reuse it. + @timeit_debug global_timer "lu" nl_solver_params.preconditioners[ir] = + (lu(sparse(precon_matrix)), precon_matrix, input_buffer, + output_buffer) + else + # LU decomposition was previously created. The Jacobian always + # has the same sparsity pattern, so by using `lu!()` we can + # reuse some setup. + try + @timeit_debug global_timer "lu!" lu!(orig_lu, sparse(precon_matrix); check=false) + catch e + if !isa(e, ArgumentError) + rethrow(e) + end + println("Sparsity pattern of matrix changed, rebuilding " + * " LU from scratch") + @timeit_debug global_timer "lu" orig_lu = lu(sparse(precon_matrix)) + end + nl_solver_params.preconditioners[ir] = + (orig_lu, precon_matrix, input_buffer, output_buffer) + end + else + nl_solver_params.preconditioners[ir] = + (orig_lu, precon_matrix, input_buffer, output_buffer) + end + end + + + @timeit_debug global_timer lu_precon!(x) = begin + precon_ppar, precon_f = x + + precon_lu, _, this_input_buffer, this_output_buffer = + nl_solver_params.preconditioners[ir] + + begin_serial_region() + counter = 1 + @loop_z_vperp_vpa iz ivperp ivpa begin + this_input_buffer[counter] = precon_f[ivpa,ivperp,iz] + counter += 1 + end + @loop_z iz begin + this_input_buffer[counter] = precon_ppar[iz] + counter += 1 + end + + begin_serial_region() + @serial_region begin + @timeit_debug global_timer "ldiv!" ldiv!(this_output_buffer, precon_lu, this_input_buffer) + end + + begin_serial_region() + counter = 1 + @loop_z_vperp_vpa iz ivperp ivpa begin + precon_f[ivpa,ivperp,iz] = this_output_buffer[counter] + counter += 1 + end + @loop_z iz begin + precon_ppar[iz] = this_output_buffer[counter] + counter += 1 + end + + # Ensure values of precon_f and precon_ppar are consistent across + # distributed-MPI block boundaries. For precon_f take the upwind + # value, and for precon_ppar take the average. + f_lower_endpoints = @view scratch_dummy.buffer_vpavperpr_1[:,:,ir] + f_upper_endpoints = @view scratch_dummy.buffer_vpavperpr_2[:,:,ir] + receive_buffer1 = @view scratch_dummy.buffer_vpavperpr_3[:,:,ir] + receive_buffer2 = @view scratch_dummy.buffer_vpavperpr_4[:,:,ir] + begin_vperp_vpa_region() + @loop_vperp_vpa ivperp ivpa begin + f_lower_endpoints[ivpa,ivperp] = precon_f[ivpa,ivperp,1] + f_upper_endpoints[ivpa,ivperp] = precon_f[ivpa,ivperp,end] + end + # We upwind the z-derivatives in `electron_z_advection!()`, so would + # expect that upwinding the results here in z would make sense. + # However, upwinding here makes convergence much slower (~10x), + # compared to picking the values from one side or other of the block + # boundary, or taking the average of the values on either side. + # Neither direction is special, so taking the average seems most + # sensible (although in an intial test it does not seem to converge + # faster than just picking one or the other). + # Maybe this could indicate that it is more important to have a fully + # self-consistent Jacobian inversion for the + # `electron_vpa_advection()` part rather than taking half(ish) of the + # values from one block and the other half(ish) from the other. + reconcile_element_boundaries_MPI_z_pdf_vpavperpz!( + precon_f, f_lower_endpoints, f_upper_endpoints, receive_buffer1, + receive_buffer2, z) + + begin_serial_region() + @serial_region begin + buffer_1[] = precon_ppar[1] + buffer_2[] = precon_ppar[end] + end + reconcile_element_boundaries_MPI!( + precon_ppar, buffer_1, buffer_2, buffer_3, buffer_4, z) + + return nothing + end + + left_preconditioner = identity + right_preconditioner = lu_precon! + elseif nl_solver_params.preconditioner_type === Val(:electron_adi) + + if t_params.dt[] > 1.5 * nl_solver_params.precon_dt[] || + t_params.dt[] < 2.0/3.0 * nl_solver_params.precon_dt[] + + # dt has changed significantly, so update the preconditioner + nl_solver_params.solves_since_precon_update[] = nl_solver_params.preconditioner_update_interval + end + + if nl_solver_params.solves_since_precon_update[] ≥ nl_solver_params.preconditioner_update_interval +global_rank[] == 0 && println("recalculating precon") + nl_solver_params.solves_since_precon_update[] = 0 + nl_solver_params.precon_dt[] = t_params.dt[] + + adi_info = nl_solver_params.preconditioners[ir] + + dens = @view moments.electron.dens[:,ir] + upar = @view moments.electron.upar[:,ir] + vth = @view moments.electron.vth[:,ir] + qpar = @view moments.electron.qpar[:,ir] + + # Reconstruct w_∥^3 moment of g_e from already-calculated qpar + third_moment = scratch_dummy.buffer_z_1 + dthird_moment_dz = scratch_dummy.buffer_z_2 + begin_z_region() + @loop_z iz begin + third_moment[iz] = 0.5 * qpar[iz] / electron_ppar_new[iz] / vth[iz] + end + derivative_z!(dthird_moment_dz, third_moment, buffer_1, buffer_2, + buffer_3, buffer_4, z_spectral, z) + + z_speed = @view z_advect[1].speed[:,:,:,ir] + + dpdf_dz = @view scratch_dummy.buffer_vpavperpzr_1[:,:,:,ir] + begin_vperp_vpa_region() + update_electron_speed_z!(z_advect[1], upar, vth, vpa.grid, ir) + @loop_vperp_vpa ivperp ivpa begin + @views z_advect[1].adv_fac[:,ivpa,ivperp,ir] = -z_speed[:,ivpa,ivperp] + end + #calculate the upwind derivative + @views derivative_z_pdf_vpavperpz!(dpdf_dz, f_electron_new, + z_advect[1].adv_fac[:,:,:,ir], + scratch_dummy.buffer_vpavperpr_1[:,:,ir], + scratch_dummy.buffer_vpavperpr_2[:,:,ir], + scratch_dummy.buffer_vpavperpr_3[:,:,ir], + scratch_dummy.buffer_vpavperpr_4[:,:,ir], + scratch_dummy.buffer_vpavperpr_5[:,:,ir], + scratch_dummy.buffer_vpavperpr_6[:,:,ir], + z_spectral, z) + + dpdf_dvpa = @view scratch_dummy.buffer_vpavperpzr_2[:,:,:,ir] + begin_z_vperp_region() + update_electron_speed_vpa!(vpa_advect[1], dens, upar, + electron_ppar_new, moments, vpa.grid, + external_source_settings.electron, ir) + @loop_z_vperp iz ivperp begin + @views @. vpa_advect[1].adv_fac[:,ivperp,iz,ir] = -vpa_advect[1].speed[:,ivperp,iz,ir] + end + #calculate the upwind derivative of the electron pdf w.r.t. wpa + @loop_z_vperp iz ivperp begin + @views derivative!(dpdf_dvpa[:,ivperp,iz], f_electron_new[:,ivperp,iz], vpa, + vpa_advect[1].adv_fac[:,ivperp,iz,ir], vpa_spectral) + end + + zeroth_moment = z.scratch_shared + first_moment = z.scratch_shared2 + second_moment = z.scratch_shared3 + begin_z_region() + vpa_grid = vpa.grid + vpa_wgts = vpa.wgts + @loop_z iz begin + @views zeroth_moment[iz] = integrate_over_vspace(f_electron_new[:,1,iz], vpa_wgts) + @views first_moment[iz] = integrate_over_vspace(f_electron_new[:,1,iz], vpa_grid, vpa_wgts) + @views second_moment[iz] = integrate_over_vspace(f_electron_new[:,1,iz], vpa_grid, 2, vpa_wgts) + end + + v_size = vperp.n * vpa.n + + # Do setup for 'v solves' + v_solve_counter = 0 + A = adi_info.v_solve_matrix_buffer + explicit_J = adi_info.J_buffer + # Get sparse matrix for explicit, right-hand-side part of the + # solve. + if adi_info.n_extra_iterations > 0 + # If we only do one 'iteration' we don't need the 'explicit + # matrix' for the first solve (the v-solve), because the initial + # guess is zero, + fill_electron_kinetic_equation_Jacobian!( + explicit_J, f_electron_new, electron_ppar_new, moments, + phi, collisions, composition, z, vperp, vpa, z_spectral, + vperp_spectral, vpa_spectral, z_advect, vpa_advect, + scratch_dummy, external_source_settings, num_diss_params, + t_params, ion_dt, ir, evolve_ppar, :explicit_z, false) + end + begin_z_region() + @loop_z iz begin + v_solve_counter += 1 + # Get LU-factorized matrix for implicit part of the solve + @views fill_electron_kinetic_equation_v_only_Jacobian!( + A, f_electron_new[:,:,iz], electron_ppar_new[iz], + dpdf_dz[:,:,iz], dpdf_dvpa[:,:,iz], z_speed, moments, + zeroth_moment[iz], first_moment[iz], second_moment[iz], + third_moment[iz], dthird_moment_dz[iz], phi[iz], collisions, + composition, z, vperp, vpa, z_spectral, vperp_spectral, + vpa_spectral, z_advect, vpa_advect, scratch_dummy, + external_source_settings, num_diss_params, t_params, ion_dt, + ir, iz, evolve_ppar) + A_sparse = sparse(A) + if !isassigned(adi_info.v_solve_implicit_lus, v_solve_counter) + @timeit_debug global_timer "lu" adi_info.v_solve_implicit_lus[v_solve_counter] = lu(A_sparse) + else + # LU decomposition was previously created. The Jacobian always + # has the same sparsity pattern, so by using `lu!()` we can + # reuse some setup. + try + @timeit_debug global_timer "lu!" lu!(adi_info.v_solve_implicit_lus[v_solve_counter], A_sparse; check=false) + catch e + if !isa(e, ArgumentError) + rethrow(e) + end + println("Sparsity pattern of matrix changed, rebuilding " + * " LU from scratch ir=$ir, iz=$iz") + @timeit_debug global_timer "lu" adi_info.v_solve_implicit_lus[v_solve_counter] = lu(A_sparse) + end + end + + if adi_info.n_extra_iterations > 0 + # If we only do one 'iteration' we don't need the 'explicit + # matrix' for the first solve (the v-solve), because the + # initial guess is zero, + adi_info.v_solve_explicit_matrices[v_solve_counter] = sparse(@view(explicit_J[adi_info.v_solve_global_inds[v_solve_counter],:])) + end + end + @boundscheck v_solve_counter == adi_info.v_solve_nsolve || error("v_solve_counter($v_solve_counter) != v_solve_nsolve($(adi_info.v_solve_nsolve))") + + # Do setup for 'z solves' + z_solve_counter = 0 + A = adi_info.z_solve_matrix_buffer + explicit_J = adi_info.J_buffer + # Get sparse matrix for explicit, right-hand-side part of the + # solve. + fill_electron_kinetic_equation_Jacobian!( + explicit_J, f_electron_new, electron_ppar_new, moments, phi, + collisions, composition, z, vperp, vpa, z_spectral, + vperp_spectral, vpa_spectral, z_advect, vpa_advect, scratch_dummy, + external_source_settings, num_diss_params, t_params, ion_dt, ir, + evolve_ppar, :explicit_v, false) + begin_vperp_vpa_region() + @loop_vperp_vpa ivperp ivpa begin + z_solve_counter += 1 + + # Get LU-factorized matrix for implicit part of the solve + @views fill_electron_kinetic_equation_z_only_Jacobian_f!( + A, f_electron_new[ivpa,ivperp,:], electron_ppar_new, + dpdf_dz[ivpa,ivperp,:], dpdf_dvpa[ivpa,ivperp,:], z_speed, + moments, zeroth_moment, first_moment, second_moment, + third_moment, dthird_moment_dz, collisions, composition, z, + vperp, vpa, z_spectral, vperp_spectral, vpa_spectral, + z_advect, vpa_advect, scratch_dummy, external_source_settings, + num_diss_params, t_params, ion_dt, ir, ivperp, ivpa, + evolve_ppar) + + A_sparse = sparse(A) + if !isassigned(adi_info.z_solve_implicit_lus, z_solve_counter) + @timeit_debug global_timer "lu" adi_info.z_solve_implicit_lus[z_solve_counter] = lu(A_sparse) + else + # LU decomposition was previously created. The Jacobian always + # has the same sparsity pattern, so by using `lu!()` we can + # reuse some setup. + try + @timeit_debug global_timer "lu!" lu!(adi_info.z_solve_implicit_lus[z_solve_counter], A_sparse; check=false) + catch e + if !isa(e, ArgumentError) + rethrow(e) + end + println("Sparsity pattern of matrix changed, rebuilding " + * " LU from scratch ir=$ir, ivperp=$ivperp, ivpa=$ivpa") + @timeit_debug global_timer "lu" adi_info.z_solve_implicit_lus[z_solve_counter] = lu(A_sparse) + end + end + + adi_info.z_solve_explicit_matrices[z_solve_counter] = sparse(@view(explicit_J[adi_info.z_solve_global_inds[z_solve_counter],:])) + end + begin_serial_region(; no_synchronize=true) + @serial_region begin + # Do the solve for ppar on the rank-0 process, which has the + # fewest grid points to handle if there are not an exactly equal + # number of points for each process. + z_solve_counter += 1 + + # Get LU-factorized matrix for implicit part of the solve + @views fill_electron_kinetic_equation_z_only_Jacobian_ppar!( + A, electron_ppar_new, moments, zeroth_moment, first_moment, + second_moment, third_moment, dthird_moment_dz, collisions, + composition, z, vperp, vpa, z_spectral, vperp_spectral, + vpa_spectral, z_advect, vpa_advect, scratch_dummy, + external_source_settings, num_diss_params, t_params, ion_dt, + ir, evolve_ppar) + + A_sparse = sparse(A) + if !isassigned(adi_info.z_solve_implicit_lus, z_solve_counter) + @timeit_debug global_timer "lu" adi_info.z_solve_implicit_lus[z_solve_counter] = lu(A_sparse) + else + # LU decomposition was previously created. The Jacobian always + # has the same sparsity pattern, so by using `lu!()` we can + # reuse some setup. + try + @timeit_debug global_timer "lu!" lu!(adi_info.z_solve_implicit_lus[z_solve_counter], A_sparse; check=false) + catch e + if !isa(e, ArgumentError) + rethrow(e) + end + println("Sparsity pattern of matrix changed, rebuilding " + * " LU from scratch ir=$ir, ppar z-solve") + @timeit_debug global_timer "lu" adi_info.z_solve_implicit_lus[z_solve_counter] = lu(A_sparse) + end + end + + adi_info.z_solve_explicit_matrices[z_solve_counter] = sparse(@view(explicit_J[adi_info.z_solve_global_inds[z_solve_counter],:])) + end + @boundscheck z_solve_counter == adi_info.z_solve_nsolve || error("z_solve_counter($z_solve_counter) != z_solve_nsolve($(adi_info.z_solve_nsolve))") + end + + @timeit_debug global_timer adi_precon!(x) = begin + precon_ppar, precon_f = x + + adi_info = nl_solver_params.preconditioners[ir] + precon_iterations = nl_solver_params.precon_iterations + this_input_buffer = adi_info.input_buffer + this_intermediate_buffer = adi_info.intermediate_buffer + this_output_buffer = adi_info.output_buffer + global_index_subrange = adi_info.global_index_subrange + n_extra_iterations = adi_info.n_extra_iterations + + v_size = vperp.n * vpa.n + pdf_size = z.n * v_size + + # Use these views to communicate block-boundary points + output_buffer_pdf_view = reshape(@view(this_output_buffer[1:pdf_size]), size(precon_f)) + output_buffer_ppar_view = @view(this_output_buffer[pdf_size+1:end]) + f_lower_endpoints = @view scratch_dummy.buffer_vpavperpr_1[:,:,ir] + f_upper_endpoints = @view scratch_dummy.buffer_vpavperpr_2[:,:,ir] + receive_buffer1 = @view scratch_dummy.buffer_vpavperpr_3[:,:,ir] + receive_buffer2 = @view scratch_dummy.buffer_vpavperpr_4[:,:,ir] + + function adi_communicate_boundary_points() + # Ensure values of precon_f and precon_ppar are consistent across + # distributed-MPI block boundaries. For precon_f take the upwind + # value, and for precon_ppar take the average. + begin_vperp_vpa_region() + @loop_vperp_vpa ivperp ivpa begin + f_lower_endpoints[ivpa,ivperp] = output_buffer_pdf_view[ivpa,ivperp,1] + f_upper_endpoints[ivpa,ivperp] = output_buffer_pdf_view[ivpa,ivperp,end] + end + # We upwind the z-derivatives in `electron_z_advection!()`, so would + # expect that upwinding the results here in z would make sense. + # However, upwinding here makes convergence much slower (~10x), + # compared to picking the values from one side or other of the block + # boundary, or taking the average of the values on either side. + # Neither direction is special, so taking the average seems most + # sensible (although in an intial test it does not seem to converge + # faster than just picking one or the other). + # Maybe this could indicate that it is more important to have a fully + # self-consistent Jacobian inversion for the + # `electron_vpa_advection()` part rather than taking half(ish) of the + # values from one block and the other half(ish) from the other. + reconcile_element_boundaries_MPI_z_pdf_vpavperpz!( + output_buffer_pdf_view, f_lower_endpoints, f_upper_endpoints, receive_buffer1, + receive_buffer2, z) + + begin_serial_region() + @serial_region begin + buffer_1[] = output_buffer_ppar_view[1] + buffer_2[] = output_buffer_ppar_view[end] + end + reconcile_element_boundaries_MPI!( + output_buffer_ppar_view, buffer_1, buffer_2, buffer_3, buffer_4, z) + + return nothing + end + + begin_z_vperp_vpa_region() + @loop_z_vperp_vpa iz ivperp ivpa begin + row = (iz - 1)*v_size + (ivperp - 1)*vpa.n + ivpa + this_input_buffer[row] = precon_f[ivpa,ivperp,iz] + end + begin_z_region() + @loop_z iz begin + row = pdf_size + iz + this_input_buffer[row] = precon_ppar[iz] + end + _block_synchronize() + + # Use this to copy current guess from output_buffer to + # intermediate_buffer, to avoid race conditions as new guess is + # written into output_buffer. + function fill_intermediate_buffer!() + _block_synchronize() + for i ∈ global_index_subrange + this_intermediate_buffer[i] = this_output_buffer[i] + end + _block_synchronize() + end + + v_solve_global_inds = adi_info.v_solve_global_inds + v_solve_nsolve = adi_info.v_solve_nsolve + v_solve_implicit_lus = adi_info.v_solve_implicit_lus + v_solve_explicit_matrices = adi_info.v_solve_explicit_matrices + v_solve_buffer = adi_info.v_solve_buffer + v_solve_buffer2 = adi_info.v_solve_buffer2 + function first_adi_v_solve!() + # The initial guess is all-zero, so for the first solve there is + # no need to multiply by the 'explicit matrix' as x==0, so E.x==0 + for isolve ∈ 1:v_solve_nsolve + this_inds = v_solve_global_inds[isolve] + v_solve_buffer .= this_input_buffer[this_inds] + @timeit_debug global_timer "ldiv!" ldiv!(v_solve_buffer2, v_solve_implicit_lus[isolve], v_solve_buffer) + this_output_buffer[this_inds] .= v_solve_buffer2 + end + end + function adi_v_solve!() + for isolve ∈ 1:v_solve_nsolve + this_inds = v_solve_global_inds[isolve] + v_solve_buffer .= @view this_input_buffer[this_inds] + # Need to multiply the 'explicit matrix' by -1, because all + # the Jacobian-calculation functions are defined as if the + # terms are being added to the left-hand-side preconditioner + # matrix, but here the 'explicit matrix' terms are added on + # the right-hand-side. + @timeit_debug global_timer "mul!" mul!(v_solve_buffer, v_solve_explicit_matrices[isolve], + this_intermediate_buffer, -1.0, 1.0) + @timeit_debug global_timer "ldiv!" ldiv!(v_solve_buffer2, v_solve_implicit_lus[isolve], v_solve_buffer) + this_output_buffer[this_inds] .= v_solve_buffer2 + end + end + + z_solve_global_inds = adi_info.z_solve_global_inds + z_solve_nsolve = adi_info.z_solve_nsolve + z_solve_implicit_lus = adi_info.z_solve_implicit_lus + z_solve_explicit_matrices = adi_info.z_solve_explicit_matrices + z_solve_buffer = adi_info.z_solve_buffer + z_solve_buffer2 = adi_info.z_solve_buffer2 + function adi_z_solve!() + for isolve ∈ 1:z_solve_nsolve + this_inds = z_solve_global_inds[isolve] + z_solve_buffer .= @view this_input_buffer[this_inds] + # Need to multiply the 'explicit matrix' by -1, because all + # the Jacobian-calculation functions are defined as if the + # terms are being added to the left-hand-side preconditioner + # matrix, but here the 'explicit matrix' terms are added on + # the right-hand-side. + @timeit_debug global_timer "mul!" mul!(z_solve_buffer, z_solve_explicit_matrices[isolve], this_intermediate_buffer, -1.0, 1.0) + @timeit_debug global_timer "ldiv!" ldiv!(z_solve_buffer2, z_solve_implicit_lus[isolve], z_solve_buffer) + this_output_buffer[this_inds] .= z_solve_buffer2 + end + end + + precon_iterations[] += 1 + first_adi_v_solve!() + fill_intermediate_buffer!() + adi_z_solve!() + adi_communicate_boundary_points() + + for n ∈ 1:n_extra_iterations + precon_iterations[] += 1 + fill_intermediate_buffer!() + adi_v_solve!() + fill_intermediate_buffer!() + adi_z_solve!() + adi_communicate_boundary_points() + end + + # Unpack preconditioner solution + begin_z_vperp_vpa_region() + @loop_z_vperp_vpa iz ivperp ivpa begin + row = (iz - 1)*v_size + (ivperp - 1)*vpa.n + ivpa + precon_f[ivpa,ivperp,iz] = this_output_buffer[row] + end + begin_z_region() + @loop_z iz begin + row = pdf_size + iz + precon_ppar[iz] = this_output_buffer[row] + end + + return nothing + end + + left_preconditioner = identity + right_preconditioner = adi_precon! + elseif nl_solver_params.preconditioner_type === Val(:none) + left_preconditioner = identity + right_preconditioner = identity + else + error("preconditioner_type=$(nl_solver_params.preconditioner_type) is not " + * "supported by electron_backward_euler!().") + end + + # Do a backward-Euler update of the electron pdf, and (if evove_ppar=true) the + # electron parallel pressure. + function residual_func!(this_residual, new_variables; krylov=false) + electron_ppar_residual, f_electron_residual = this_residual + electron_ppar_newvar, f_electron_newvar = new_variables + + if evolve_ppar + this_dens = moments.electron.dens + this_upar = moments.electron.upar + this_vth = moments.electron.vth + begin_z_region() + @loop_z iz begin + # update the electron thermal speed using the updated electron + # parallel pressure + this_vth[iz,ir] = sqrt(abs(2.0 * electron_ppar_newvar[iz] / + (this_dens[iz,ir] * + composition.me_over_mi))) + end + end + + # enforce the boundary condition(s) on the electron pdf + @views enforce_boundary_condition_on_electron_pdf!( + f_electron_newvar, phi, moments.electron.vth[:,ir], + moments.electron.upar[:,ir], z, vperp, vpa, vperp_spectral, + vpa_spectral, vpa_advect, moments, + num_diss_params.electron.vpa_dissipation_coefficient > 0.0, + composition.me_over_mi, ir; bc_constraints=false, + update_vcut=!krylov) + + if evolve_ppar + # Calculate heat flux and derivatives using new_variables + @views calculate_electron_qpar_from_pdf_no_r!(moments.electron.qpar[:,ir], + electron_ppar_newvar, + moments.electron.vth[:,ir], + f_electron_newvar, vpa, + ir) + + calculate_electron_moment_derivatives_no_r!( + moments, + (electron_density=this_dens, + electron_upar=this_upar, + electron_ppar=electron_ppar_newvar), + scratch_dummy, z, z_spectral, + num_diss_params.electron.moment_dissipation_coefficient, ir) + else + # Calculate heat flux and derivatives using new_variables + @views calculate_electron_qpar_from_pdf_no_r!(moments.electron.qpar[:,ir], + electron_ppar_newvar, + moments.electron.vth[:,ir], + f_electron_newvar, vpa, + ir) + # compute the z-derivative of the parallel electron heat flux + @views derivative_z!(moments.electron.dqpar_dz[:,ir], + moments.electron.qpar[:,ir], buffer_1, buffer_2, + buffer_3, buffer_4, z_spectral, z) + end + + if evolve_ppar + begin_z_region() + @loop_z iz begin + electron_ppar_residual[iz] = electron_ppar_old[iz,ir] + end + else + begin_z_region() + @loop_z iz begin + electron_ppar_residual[iz] = 0.0 + end + end + + # electron_kinetic_equation_euler_update!() just adds dt*d(g_e)/dt to the + # electron_pdf member of the first argument, so if we set the electron_pdf member + # of the first argument to zero, and pass dt=1, then it will evaluate the time + # derivative, which is the residual for a steady-state solution. + begin_z_vperp_vpa_region() + @loop_z_vperp_vpa iz ivperp ivpa begin + f_electron_residual[ivpa,ivperp,iz] = f_electron_old[ivpa,ivperp,iz] + end + electron_kinetic_equation_euler_update!( + f_electron_residual, electron_ppar_residual, f_electron_newvar, + electron_ppar_newvar, moments, z, vperp, vpa, z_spectral, + vpa_spectral, z_advect, vpa_advect, scratch_dummy, collisions, + composition, external_source_settings, num_diss_params, t_params, + ir; evolve_ppar=evolve_ppar, ion_dt=ion_dt, + soft_force_constraints=true) + + # Now + # residual = f_electron_old + dt*RHS(f_electron_newvar) + # so update to desired residual + begin_z_vperp_vpa_region() + @loop_z_vperp_vpa iz ivperp ivpa begin + f_electron_residual[ivpa,ivperp,iz] = f_electron_newvar[ivpa,ivperp,iz] - f_electron_residual[ivpa,ivperp,iz] + end + if evolve_ppar + begin_z_region() + @loop_z iz begin + electron_ppar_residual[iz] = electron_ppar_newvar[iz] - electron_ppar_residual[iz] + end + end + + # Set residual to zero where pdf_electron is determined by boundary conditions. + if vpa.n > 1 + begin_z_vperp_region() + @loop_z_vperp iz ivperp begin + @views enforce_v_boundary_condition_local!(f_electron_residual[:,ivperp,iz], vpa.bc, + vpa_advect[1].speed[:,ivperp,iz,ir], + num_diss_params.electron.vpa_dissipation_coefficient > 0.0, + vpa, vpa_spectral) + end + end + if vperp.n > 1 + begin_z_vpa_region() + enforce_vperp_boundary_condition!(f_electron_residual, vperp.bc, + vperp, vperp_spectral, vperp_adv, + vperp_diffusion, ir) + end + zero_z_boundary_condition_points(f_electron_residual, z, vpa, moments, ir) + + return nothing + end + + residual = (scratch_dummy.implicit_buffer_z_1, scratch_dummy.implicit_buffer_vpavperpz_1) + delta_x = (scratch_dummy.implicit_buffer_z_2, + scratch_dummy.implicit_buffer_vpavperpz_2) + rhs_delta = (scratch_dummy.implicit_buffer_z_3, + scratch_dummy.implicit_buffer_vpavperpz_3) + v = (scratch_dummy.implicit_buffer_z_4, + scratch_dummy.implicit_buffer_vpavperpz_4) + w = (scratch_dummy.implicit_buffer_z_5, + scratch_dummy.implicit_buffer_vpavperpz_5) + + newton_success = newton_solve!((electron_ppar_new, f_electron_new), + residual_func!, residual, delta_x, rhs_delta, + v, w, nl_solver_params; + left_preconditioner=left_preconditioner, + right_preconditioner=right_preconditioner, + coords=(z=z, vperp=vperp, vpa=vpa)) + + return newton_success +end + """ implicit_electron_advance!() @@ -2246,23 +2264,68 @@ function apply_electron_bc_and_constraints!(this_scratch, phi, moments, r, z, vp end end -function apply_electron_bc_and_constraints_no_r!(f_electron, phi, moments, z, vperp, +function apply_electron_bc_and_constraints_no_r!(f_electron, phi, moments, r, z, vperp, vpa, vperp_spectral, vpa_spectral, vpa_advect, num_diss_params, composition, - ir; lowerz_vcut_inds=nothing, - upperz_vcut_inds=nothing) + ir, nl_solver_params) begin_z_vperp_vpa_region() @loop_z_vperp_vpa iz ivperp ivpa begin f_electron[ivpa,ivperp,iz] = max(f_electron[ivpa,ivperp,iz], 0.0) end + new_lowerz_vcut_ind = @view r.scratch_shared_int[ir:ir] + new_upperz_vcut_ind = @view r.scratch_shared_int2[ir:ir] + # enforce the boundary condition(s) on the electron pdf @views enforce_boundary_condition_on_electron_pdf!( f_electron, phi, moments.electron.vth[:,ir], moments.electron.upar[:,ir], z, vperp, vpa, vperp_spectral, vpa_spectral, vpa_advect, moments, num_diss_params.electron.vpa_dissipation_coefficient > 0.0, - composition.me_over_mi, ir; lowerz_vcut_inds=lowerz_vcut_inds, - upperz_vcut_inds=upperz_vcut_inds) + composition.me_over_mi, ir; lowerz_vcut_ind=new_lowerz_vcut_ind, + upperz_vcut_ind=new_upperz_vcut_ind) + + # Check if either vcut_ind has changed - if either has, recalculate the + # preconditioner because the response at the grid point before the cutoff is + # sharp, so the preconditioner could be significantly wrong when it was + # calculated using the wrong vcut_ind. + lower_vcut_changed = @view z.scratch_shared_int[1:1] + upper_vcut_changed = @view z.scratch_shared_int[2:2] + @serial_region begin + if z.irank == 0 + precon_lowerz_vcut_inds = nl_solver_params.precon_lowerz_vcut_inds + if new_lowerz_vcut_ind[] == precon_lowerz_vcut_inds[ir] + lower_vcut_changed[] = 0 + else + lower_vcut_changed[] = 1 + precon_lowerz_vcut_inds[ir] = new_lowerz_vcut_ind[] + end + end + MPI.Bcast!(lower_vcut_changed, comm_inter_block[]; root=0) + #req1 = MPI.Ibcast!(lower_vcut_changed, comm_inter_block[]; root=0) + + if z.irank == z.nrank - 1 + precon_upperz_vcut_inds = nl_solver_params.precon_upperz_vcut_inds + if new_upperz_vcut_ind[] == precon_upperz_vcut_inds[ir] + upper_vcut_changed[] = 0 + else + upper_vcut_changed[] = 1 + precon_upperz_vcut_inds[ir] = new_upperz_vcut_ind[] + end + end + MPI.Bcast!(upper_vcut_changed, comm_inter_block[]; root=n_blocks[]-1) + #req2 = MPI.Ibcast!(upper_vcut_changed, comm_inter_block[]; root=n_blocks[]-1) + + # Eventually can use Ibcast!() to make the two broadcasts run + # simultaneously, but need the function to be merged into MPI.jl (see + # https://github.com/JuliaParallel/MPI.jl/pull/882). + #MPI.Waitall([req1, req2]) + end + _block_synchronize() + if lower_vcut_changed[] == 1 || upper_vcut_changed[] == 1 + # One or both of the indices changed for some `ir`, so force the + # preconditioner to be recalculated next time. + nl_solver_params.solves_since_precon_update[] = nl_solver_params.preconditioner_update_interval + end begin_z_region() A = moments.electron.constraints_A_coefficient @@ -2745,8 +2808,8 @@ end @timeit global_timer enforce_boundary_condition_on_electron_pdf!( pdf, phi, vthe, upar, z, vperp, vpa, vperp_spectral, vpa_spectral, vpa_adv, moments, vpa_diffusion, me_over_mi, ir; - bc_constraints=true, update_vcut=true, lowerz_vcut_inds=nothing, - upperz_vcut_inds=nothing) = begin + bc_constraints=true, update_vcut=true, lowerz_vcut_ind=nothing, + upperz_vcut_ind=nothing) = begin @boundscheck bc_constraints && !update_vcut && error("update_vcut is not used when bc_constraints=true, but update_vcut has non-default value") @@ -2946,13 +3009,13 @@ end # plus_vcut_ind+1 where vcut is. vcut_fraction = get_plus_vcut_fraction(vcut, plus_vcut_ind, vpa_unnorm) if vcut_fraction > 0.5 - if lowerz_vcut_inds !== nothing - lowerz_vcut_inds[ir] = plus_vcut_ind+1 + if lowerz_vcut_ind !== nothing + lowerz_vcut_ind[] = plus_vcut_ind+1 end pdf[plus_vcut_ind+1,1,1] *= vcut_fraction - 0.5 else - if lowerz_vcut_inds !== nothing - lowerz_vcut_inds[ir] = plus_vcut_ind + if lowerz_vcut_ind !== nothing + lowerz_vcut_ind[] = plus_vcut_ind end pdf[plus_vcut_ind+1,1,1] = 0.0 pdf[plus_vcut_ind,1,1] *= vcut_fraction + 0.5 @@ -3142,13 +3205,13 @@ end # minus_vcut_ind where -vcut is. vcut_fraction = get_minus_vcut_fraction(vcut, minus_vcut_ind, vpa_unnorm) if vcut_fraction < 0.5 - if upperz_vcut_inds !== nothing - upperz_vcut_inds[ir] = minus_vcut_ind-1 + if upperz_vcut_ind !== nothing + upperz_vcut_ind[] = minus_vcut_ind-1 end pdf[minus_vcut_ind-1,1,end] *= 0.5 - vcut_fraction else - if upperz_vcut_inds !== nothing - upperz_vcut_inds[ir] = minus_vcut_ind + if upperz_vcut_ind !== nothing + upperz_vcut_ind[] = minus_vcut_ind end pdf[minus_vcut_ind-1,1,end] = 0.0 pdf[minus_vcut_ind,1,end] *= 1.5 - vcut_fraction From b85465a28ce855563be544b42abac8cf8cf90b4b Mon Sep 17 00:00:00 2001 From: John Omotani Date: Sat, 7 Dec 2024 18:00:00 +0000 Subject: [PATCH 04/23] Fix adaptive timestep resetting if electron pseudotimestep loop fails --- moment_kinetics/src/time_advance.jl | 50 +++++++++++++++++------------ 1 file changed, 30 insertions(+), 20 deletions(-) diff --git a/moment_kinetics/src/time_advance.jl b/moment_kinetics/src/time_advance.jl index 2c5704935..e5b7a1720 100644 --- a/moment_kinetics/src/time_advance.jl +++ b/moment_kinetics/src/time_advance.jl @@ -3101,7 +3101,7 @@ end # which is used as input to the explicit part of the IMEX time step. old_scratch = scratch_implicit[istage] update_electrons = !(t_params.implicit_electron_advance || t_params.implicit_electron_ppar) - success = apply_all_bcs_constraints_update_moments!( + bcs_constraints_success = apply_all_bcs_constraints_update_moments!( scratch_implicit[istage], pdf, moments, fields, boundary_distributions, scratch_electron, vz, vr, vzeta, vpa, vperp, z, r, spectral_objects, advect_objects, composition, collisions, @@ -3109,6 +3109,9 @@ end t_params, nl_solver_params, advance, scratch_dummy, false, max_electron_pdf_iterations, max_electron_sim_time; update_electrons=update_electrons) + if bcs_constraints_success != "" + success = bcs_constrains_success + end if success != "" # Break out of the istage loop, as passing `success != ""` to the # adaptive timestep update function will signal a failed timestep, so @@ -3148,7 +3151,7 @@ end update_electrons = (t_params.rk_coefs_implicit === nothing || !(t_params.implicit_electron_advance || t_params.implicit_electron_ppar)) diagnostic_moments = diagnostic_checks && istage == n_rk_stages - success = apply_all_bcs_constraints_update_moments!( + bcs_constraints_success = apply_all_bcs_constraints_update_moments!( scratch[istage+1], pdf, moments, fields, boundary_distributions, scratch_electron, vz, vr, vzeta, vpa, vperp, z, r, spectral_objects, advect_objects, composition, collisions, geometry, gyroavs, @@ -3156,6 +3159,9 @@ end advance, scratch_dummy, diagnostic_moments, max_electron_pdf_iterations, max_electron_sim_time; pdf_bc_constraints=apply_bc_constraints, update_electrons=update_electrons) + if bcs_constraints_success != "" + success = bcs_constrains_success + end if success != "" # Break out of the istage loop, as passing `success != ""` to the # adaptive timestep update function will signal a failed timestep, so @@ -3585,6 +3591,7 @@ end electron_z_advect, electron_vpa_advect = advect_objects.electron_z_advect, advect_objects.electron_vpa_advect neutral_z_advect, neutral_r_advect, neutral_vz_advect = advect_objects.neutral_z_advect, advect_objects.neutral_r_advect, advect_objects.neutral_vz_advect + success = true if t_params.implicit_electron_advance electron_success = implicit_electron_advance!(fvec_out, fvec_in, pdf, scratch_electron, moments, fields, @@ -3599,7 +3606,7 @@ end dt, nl_solver_params.electron_advance) - success = (electron_success == "") + success = success && (electron_success == "") elseif t_params.implicit_electron_ppar max_electron_pdf_iterations = t_params.electron.max_pseudotimesteps max_electron_sim_time = t_params.electron.max_pseudotime @@ -3623,7 +3630,7 @@ end fvec_out_electron_ppar[iz,ir] = moments_electron_ppar[iz,ir] end - success = (electron_success == "") + success = success && (electron_success == "") elseif advance.electron_conduction success = implicit_braginskii_conduction!(fvec_out, fvec_in, moments, z, r, dt, @@ -3633,23 +3640,26 @@ end end if nl_solver_params.ion_advance !== nothing - success = implicit_ion_advance!(fvec_out, fvec_in, pdf, fields, moments, - advect_objects, vz, vr, vzeta, vpa, vperp, - gyrophase, z, r, t_params.t[], dt, - spectral_objects, composition, collisions, - geometry, scratch_dummy, manufactured_source_list, - external_source_settings, num_diss_params, - gyroavs, nl_solver_params.ion_advance, advance, - fp_arrays, istage) + ion_success = implicit_ion_advance!(fvec_out, fvec_in, pdf, fields, moments, + advect_objects, vz, vr, vzeta, vpa, vperp, + gyrophase, z, r, t_params.t[], dt, + spectral_objects, composition, collisions, + geometry, scratch_dummy, + manufactured_source_list, + external_source_settings, num_diss_params, + gyroavs, nl_solver_params.ion_advance, + advance, fp_arrays, istage) + success = success && ion_success elseif advance.vpa_advection - success = implicit_vpa_advection!(fvec_out.pdf, fvec_in, fields, moments, - z_advect, vpa_advect, vpa, vperp, z, r, dt, - t_params.t[], r_spectral, z_spectral, - vpa_spectral, composition, collisions, - external_source_settings.ion, geometry, - nl_solver_params.vpa_advection, - advance.vpa_diffusion, num_diss_params, gyroavs, - scratch_dummy) + ion_success = implicit_vpa_advection!(fvec_out.pdf, fvec_in, fields, moments, + z_advect, vpa_advect, vpa, vperp, z, r, dt, + t_params.t[], r_spectral, z_spectral, + vpa_spectral, composition, collisions, + external_source_settings.ion, geometry, + nl_solver_params.vpa_advection, + advance.vpa_diffusion, num_diss_params, + gyroavs, scratch_dummy) + success = success && ion_success end return success From 29b4703d3f762d896e022e1be778d26e9b2a2555 Mon Sep 17 00:00:00 2001 From: John Omotani Date: Sat, 7 Dec 2024 18:02:55 +0000 Subject: [PATCH 05/23] Option to time-evolve the electron shape function Uses an implicit timestep so that the electron shape function can be advanced with the ion timestep. Does not test the accuracy of the timestep for the electron shape function, so that the error control on the timestepper does not try to resolve fast electron dynamics. Can be used to find steady state, because then dg_e/dt=0 in the steady state anyway, so there is no error. When the time-dependence is needed, dg_e/dt should be a mass-ratio-small term, so maybe is OK anyway? --- .../src/electron_fluid_equations.jl | 7 +- .../src/electron_kinetic_equation.jl | 8 +- moment_kinetics/src/file_io.jl | 23 ++- moment_kinetics/src/initial_conditions.jl | 8 + moment_kinetics/src/input_structs.jl | 2 + moment_kinetics/src/moment_kinetics_input.jl | 1 + .../src/moment_kinetics_structs.jl | 1 + moment_kinetics/src/time_advance.jl | 170 +++++++++++++++--- util/precompile_run.jl | 1 + util/precompile_run_kinetic-electrons.jl | 3 +- 10 files changed, 184 insertions(+), 40 deletions(-) diff --git a/moment_kinetics/src/electron_fluid_equations.jl b/moment_kinetics/src/electron_fluid_equations.jl index bd2f1cdbb..516e81161 100644 --- a/moment_kinetics/src/electron_fluid_equations.jl +++ b/moment_kinetics/src/electron_fluid_equations.jl @@ -127,6 +127,11 @@ end function calculate_electron_moments!(scratch, pdf, moments, composition, collisions, r, z, vpa) + if length(scratch.pdf_electron) > 0 + pdf_electron = scratch.pdf_electron + else + pdf_electron = pdf.electron + end calculate_electron_density!(scratch.electron_density, moments.electron.dens_updated, scratch.density) calculate_electron_upar_from_charge_conservation!( @@ -144,7 +149,7 @@ function calculate_electron_moments!(scratch, pdf, moments, composition, collisi end update_electron_vth_temperature!(moments, scratch.electron_ppar, scratch.electron_density, composition) - calculate_electron_qpar!(moments.electron, pdf.electron, scratch.electron_ppar, + calculate_electron_qpar!(moments.electron, pdf_electron, scratch.electron_ppar, scratch.electron_upar, scratch.upar, collisions.electron_fluid.nu_ei, composition.me_over_mi, composition.electron_physics, vpa) diff --git a/moment_kinetics/src/electron_kinetic_equation.jl b/moment_kinetics/src/electron_kinetic_equation.jl index 96fed0d93..ebf96ae89 100644 --- a/moment_kinetics/src/electron_kinetic_equation.jl +++ b/moment_kinetics/src/electron_kinetic_equation.jl @@ -898,6 +898,10 @@ function electron_backward_euler_pseudotimestepping!(scratch, pdf, moments, phi, # to arrays, because f_electron_old and electron_ppar_old are captured by # residual_func!() above, so any change in the things they refer to will # cause type instability in residual_func!(). + f_electron_new = @view new_scratch.pdf_electron[:,:,:,ir] + f_electron_old = @view old_scratch.pdf_electron[:,:,:,ir] + electron_ppar_new = @view new_scratch.electron_ppar[:,ir] + electron_ppar_old = @view old_scratch.electron_ppar[:,ir] begin_z_vperp_vpa_region() @loop_z_vperp_vpa iz ivperp ivpa begin f_electron_new[ivpa,ivperp,iz] = f_electron_old[ivpa,ivperp,iz] @@ -930,6 +934,8 @@ function electron_backward_euler_pseudotimestepping!(scratch, pdf, moments, phi, end end + reset_nonlinear_per_stage_counters!(nl_solver_params) + residual_norm = -1.0 if step_success # Calculate residuals to decide if iteration is converged. @@ -999,8 +1005,6 @@ function electron_backward_euler_pseudotimestepping!(scratch, pdf, moments, phi, end end - reset_nonlinear_per_stage_counters!(nl_solver_params) - t_params.step_counter[] += 1 if electron_pdf_converged[] break diff --git a/moment_kinetics/src/file_io.jl b/moment_kinetics/src/file_io.jl index c61cf9458..e64c8c9f9 100644 --- a/moment_kinetics/src/file_io.jl +++ b/moment_kinetics/src/file_io.jl @@ -3277,9 +3277,9 @@ binary output file # add the distribution function data at this time slice to the output file write_ion_dfns_data_to_binary(scratch, t_params, n_ion_species, io_dfns, t_idx, r, z, vperp, vpa) - if scratch_electron !== nothing - write_electron_dfns_data_to_binary(scratch_electron, t_params, io_dfns, t_idx, - r, z, vperp, vpa) + if t_params.implicit_electron_time_evolving || scratch_electron !== nothing + write_electron_dfns_data_to_binary(scratch, scratch_electron, t_params, + io_dfns, t_idx, r, z, vperp, vpa) end write_neutral_dfns_data_to_binary(scratch, t_params, n_neutral_species, io_dfns, t_idx, r, z, vzeta, vr, vz) @@ -3318,7 +3318,7 @@ write time-dependent distribution function data for electrons to the binary outp Note: should only be called from within a function that (re-)opens the output file. """ -function write_electron_dfns_data_to_binary(scratch_electron, t_params, +function write_electron_dfns_data_to_binary(scratch, scratch_electron, t_params, io_dfns::Union{io_dfns_info,io_initial_electron_info}, t_idx, r, z, vperp, vpa) @serial_region begin @@ -3327,22 +3327,27 @@ function write_electron_dfns_data_to_binary(scratch_electron, t_params, parallel_io = io_dfns.io_input.parallel_io if io_dfns.f_electron !== nothing - if t_params.electron === nothing + if t_params.implicit_electron_time_evolving + n_rk_stages = t_params.n_rk_stages + this_scratch = scratch + elseif t_params.electron === nothing # t_params is the t_params for electron timestepping n_rk_stages = t_params.n_rk_stages + this_scratch = scratch_electron else n_rk_stages = t_params.electron.n_rk_stages + this_scratch = scratch_electron end append_to_dynamic_var(io_dfns.f_electron, - scratch_electron[n_rk_stages+1].pdf_electron, + this_scratch[n_rk_stages+1].pdf_electron, t_idx, parallel_io, vpa, vperp, z, r) # If options were not set to select the following outputs, then the io # variables will be `nothing` and nothing will be written. append_to_dynamic_var(io_dfns.f_electron_loworder, - scratch_electron[2].pdf_electron, + this_scratch[2].pdf_electron, t_idx, parallel_io, vpa, vperp, z, r) append_to_dynamic_var(io_dfns.f_electron_start_last_timestep, - scratch_electron[1].pdf_electron, + this_scratch[1].pdf_electron, t_idx, parallel_io, vpa, vperp, z, r) end end @@ -3408,7 +3413,7 @@ function write_electron_state(scratch_electron, moments, t_params, append_to_dynamic_var(io_initial_electron.electron_cumulative_pseudotime, t_params.t[], t_idx, parallel_io) - write_electron_dfns_data_to_binary(scratch_electron, t_params, + write_electron_dfns_data_to_binary(nothing, scratch_electron, t_params, io_initial_electron, t_idx, r, z, vperp, vpa) write_electron_moments_data_to_binary(scratch_electron, moments, t_params, diff --git a/moment_kinetics/src/initial_conditions.jl b/moment_kinetics/src/initial_conditions.jl index ca9856868..0e7af0346 100644 --- a/moment_kinetics/src/initial_conditions.jl +++ b/moment_kinetics/src/initial_conditions.jl @@ -816,6 +816,14 @@ function initialize_electron_pdf!(scratch, scratch_electron, pdf, moments, field pdf.electron.pdf_before_ion_timestep[ivpa,ivperp,iz,ir] = pdf.electron.norm[ivpa,ivperp,iz,ir] end + if length(scratch[1].pdf_electron) > 0 + @loop_r_z_vperp_vpa ir iz ivperp ivpa begin + for i ∈ 1:length(scratch) + scratch[i].pdf_electron[ivpa,ivperp,iz,ir] = + pdf.electron.norm[ivpa,ivperp,iz,ir] + end + end + end # No need to do electron I/O (apart from possibly debug I/O) any more, so if # adaptive timestep is used, it does not need to adjust to output times. diff --git a/moment_kinetics/src/input_structs.jl b/moment_kinetics/src/input_structs.jl index a367b2a68..0a17e7d47 100644 --- a/moment_kinetics/src/input_structs.jl +++ b/moment_kinetics/src/input_structs.jl @@ -79,6 +79,7 @@ struct time_info{Terrorsum <: Real, T_debug_output, T_electron, Trkimp, Timpzero maximum_dt::mk_float implicit_braginskii_conduction::Bool implicit_electron_advance::Bool + implicit_electron_time_evolving::Bool implicit_ion_advance::Bool implicit_vpa_advection::Bool implicit_electron_ppar::Bool @@ -130,6 +131,7 @@ struct advance_info continuity::Bool force_balance::Bool energy::Bool + electron_pdf::Bool electron_energy::Bool electron_conduction::Bool neutral_external_source::Bool diff --git a/moment_kinetics/src/moment_kinetics_input.jl b/moment_kinetics/src/moment_kinetics_input.jl index aaf124309..25b4c8e36 100644 --- a/moment_kinetics/src/moment_kinetics_input.jl +++ b/moment_kinetics/src/moment_kinetics_input.jl @@ -162,6 +162,7 @@ function mk_input(input_dict=OptionsDict(); save_inputs_to_txt=false, ignore_MPI maximum_dt=Inf, implicit_braginskii_conduction=true, implicit_electron_advance=false, + implicit_electron_time_evolving=false, implicit_ion_advance=false, implicit_vpa_advection=false, implicit_electron_ppar=true, diff --git a/moment_kinetics/src/moment_kinetics_structs.jl b/moment_kinetics/src/moment_kinetics_structs.jl index de28014e8..f37ca1019 100644 --- a/moment_kinetics/src/moment_kinetics_structs.jl +++ b/moment_kinetics/src/moment_kinetics_structs.jl @@ -34,6 +34,7 @@ struct scratch_pdf pperp::MPISharedArray{mk_float, ndim_moment} temp_z_s::MPISharedArray{mk_float, ndim_moment} # electrons + pdf_electron::MPISharedArray{mk_float, ndim_pdf_electron} electron_density::MPISharedArray{mk_float, ndim_moment_electron} electron_upar::MPISharedArray{mk_float, ndim_moment_electron} electron_ppar::MPISharedArray{mk_float, ndim_moment_electron} diff --git a/moment_kinetics/src/time_advance.jl b/moment_kinetics/src/time_advance.jl index e5b7a1720..97321c142 100644 --- a/moment_kinetics/src/time_advance.jl +++ b/moment_kinetics/src/time_advance.jl @@ -46,7 +46,10 @@ using ..charge_exchange: ion_charge_exchange_collisions_1V!, neutral_charge_exchange_collisions_1V!, ion_charge_exchange_collisions_3V!, neutral_charge_exchange_collisions_3V! -using ..electron_kinetic_equation: update_electron_pdf!, implicit_electron_advance! +using ..electron_kinetic_equation: update_electron_pdf!, implicit_electron_advance!, + electron_backward_euler!, + electron_kinetic_equation_euler_update!, + apply_electron_bc_and_constraints_no_r! using ..ionization: ion_ionization_collisions_1V!, neutral_ionization_collisions_1V!, ion_ionization_collisions_3V!, neutral_ionization_collisions_3V! using ..krook_collisions: krook_collisions! @@ -384,6 +387,7 @@ function setup_time_info(t_input, n_variables, code_time, dt_reload, # Not an IMEX scheme, so cannot have any implicit terms t_input["implicit_braginskii_conduction"] = false t_input["implicit_electron_advance"] = false + t_input["implicit_electron_time_evolving"] = false t_input["implicit_ion_advance"] = false t_input["implicit_vpa_advection"] = false t_input["implicit_electron_ppar"] = false @@ -394,6 +398,7 @@ function setup_time_info(t_input, n_variables, code_time, dt_reload, if composition.electron_physics ∉ (kinetic_electrons, kinetic_electrons_with_temperature_equation) t_input["implicit_electron_advance"] = false + t_input["implicit_electron_time_evolving"] = false t_input["implicit_electron_ppar"] = false end end @@ -426,6 +431,7 @@ function setup_time_info(t_input, n_variables, code_time, dt_reload, implicit_electron_ppar = false implicit_electron_advance = false + implicit_electron_time_evolving = false electron_preconditioner_type = nothing decrease_dt_iteration_threshold = t_input["decrease_dt_iteration_threshold"] increase_dt_iteration_threshold = t_input["increase_dt_iteration_threshold"] @@ -438,6 +444,7 @@ function setup_time_info(t_input, n_variables, code_time, dt_reload, debug_io = nothing implicit_electron_ppar = false implicit_electron_advance = false + implicit_electron_time_evolving = false electron_preconditioner_type = nothing decrease_dt_iteration_threshold = -1 increase_dt_iteration_threshold = typemax(mk_int) @@ -451,6 +458,8 @@ function setup_time_info(t_input, n_variables, code_time, dt_reload, implicit_electron_ppar = (t_input["implicit_electron_ppar"] !== false) implicit_electron_advance = (t_input["implicit_electron_advance"] !== false) + implicit_electron_time_evolving = (t_input["implicit_electron_time_evolving"] !== false) + electron_precon_types = Dict("lu" => :electron_lu, "adi" => :electron_adi) if implicit_electron_ppar if t_input["implicit_electron_ppar"] === true if block_size[] == 1 @@ -461,7 +470,6 @@ function setup_time_info(t_input, n_variables, code_time, dt_reload, electron_preconditioner_type = Val(:electron_adi) end else - electron_precon_types = Dict("lu" => :electron_lu, "adi" => :electron_adi) if t_input["implicit_electron_ppar"] ∈ keys(electron_precon_types) electron_preconditioner_type = Val(electron_precon_types[t_input["implicit_electron_ppar"]]) else @@ -478,6 +486,26 @@ function setup_time_info(t_input, n_variables, code_time, dt_reload, * "implicit_electron_advance.") end electron_preconditioner_type = Val(:electron_lu) + elseif implicit_electron_time_evolving + if t_input["implicit_electron_time_evolving"] === true + if block_size[] == 1 + # No need to parallelise, so un-split LU solver should be most efficient. + electron_preconditioner_type = Val(:electron_lu) + else + # Want to parallelise preconditioner, so use ADI method. + electron_preconditioner_type = Val(:electron_adi) + end + else + if t_input["implicit_electron_time_evolving"] ∈ keys(electron_precon_types) + electron_preconditioner_type = Val(electron_precon_types[t_input["implicit_electron_time_evolving"]]) + else + precon_keys = collect(keys(electron_precon_types)) + error("Unrecognised option implicit_electron_time_evolving=" + * "\"$(t_input["implicit_electron_time_evolving"])\" which " + * "should be either false/true or a string giving the type of " + * "preconditioner to use - one of $precon_keys.") + end + end else electron_preconditioner_type = Val(:none) end @@ -507,7 +535,7 @@ function setup_time_info(t_input, n_variables, code_time, dt_reload, mk_float(t_input["last_fail_proximity_factor"]), mk_float(t_input["minimum_dt"]), mk_float(t_input["maximum_dt"]), electron !== nothing && t_input["implicit_braginskii_conduction"], - implicit_electron_advance, + implicit_electron_advance, implicit_electron_time_evolving, electron !== nothing && t_input["implicit_ion_advance"], electron !== nothing && t_input["implicit_vpa_advection"], implicit_electron_ppar, electron_preconditioner_type, @@ -721,7 +749,7 @@ function setup_time_advance!(pdf, fields, vz, vr, vzeta, vpa, vperp, z, r, gyrop default_rtol=t_params.rtol / 10.0, default_atol=t_params.atol / 10.0) nl_solver_electron_advance_params = - setup_nonlinear_solve(t_params.implicit_electron_advance || composition.electron_physics ∈ (kinetic_electrons, kinetic_electrons_with_temperature_equation), + setup_nonlinear_solve(t_params.implicit_electron_advance || t_params.implicit_electron_time_evolving || t_params.implicit_electron_ppar, input_dict, (z=z, vperp=vperp, vpa=vpa), (r,); @@ -750,9 +778,10 @@ function setup_time_advance!(pdf, fields, vz, vr, vzeta, vpa, vperp, z, r, gyrop error("Cannot use implicit_ion_advance and implicit_vpa_advection at the same " * "time") end - if t_params.implicit_electron_advance && t_params.implicit_electron_ppar - error("Cannot use implicit_electron_advance and implicit_electron_ppar at the " - * "same time.") + if (t_params.implicit_electron_advance + t_params.implicit_electron_time_evolving + + t_params.implicit_electron_ppar) > 1 + error("Can only use one of implicit_electron_advance, " + * "implicit_electron_time_evolving, and implicit_electron_ppar.") end nl_solver_params = (electron_conduction=electron_conduction_nl_solve_parameters, electron_advance=nl_solver_electron_advance_params, @@ -771,9 +800,11 @@ function setup_time_advance!(pdf, fields, vz, vr, vzeta, vpa, vperp, z, r, gyrop # create an array of structs containing scratch arrays for the pdf and low-order moments # that may be evolved separately via fluid equations - scratch = setup_scratch_arrays(moments, pdf, t_params.n_rk_stages + 1) + scratch = setup_scratch_arrays(moments, pdf, t_params.n_rk_stages + 1, + t_params.implicit_electron_time_evolving) if t_params.rk_coefs_implicit !== nothing - scratch_implicit = setup_scratch_arrays(moments, pdf, t_params.n_rk_stages) + scratch_implicit = setup_scratch_arrays(moments, pdf, t_params.n_rk_stages, + t_params.implicit_electron_time_evolving) else scratch_implicit = nothing end @@ -1176,6 +1207,7 @@ function setup_advance_flags(moments, composition, t_params, collisions, advance_continuity = false advance_force_balance = false advance_energy = false + advance_electron_pdf = false advance_electron_energy = false advance_electron_conduction = false advance_neutral_z_advection = false @@ -1299,7 +1331,9 @@ function setup_advance_flags(moments, composition, t_params, collisions, # moment-kinetically then advance the electron energy equation if composition.electron_physics ∈ (kinetic_electrons, kinetic_electrons_with_temperature_equation) - if !(t_params.implicit_electron_advance || t_params.implicit_electron_ppar) + if !(t_params.implicit_electron_advance || + t_params.implicit_electron_time_evolving || + t_params.implicit_electron_ppar) advance_electron_energy = true advance_electron_conduction = true end @@ -1344,8 +1378,8 @@ function setup_advance_flags(moments, composition, t_params, collisions, advance_external_source, advance_ion_numerical_dissipation, advance_neutral_numerical_dissipation, advance_sources, advance_continuity, advance_force_balance, advance_energy, - advance_electron_energy, advance_electron_conduction, - advance_neutral_external_source, + advance_electron_pdf, advance_electron_energy, + advance_electron_conduction, advance_neutral_external_source, advance_neutral_sources, advance_neutral_continuity, advance_neutral_force_balance, advance_neutral_energy, manufactured_solns_test, r_diffusion, vpa_diffusion, @@ -1384,6 +1418,7 @@ function setup_implicit_advance_flags(moments, composition, t_params, collisions advance_continuity = false advance_force_balance = false advance_energy = false + advance_electron_pdf = false advance_electron_energy = false advance_electron_conduction = false advance_neutral_z_advection = false @@ -1458,10 +1493,14 @@ function setup_implicit_advance_flags(moments, composition, t_params, collisions advance_electron_conduction = true end - if (t_params.implicit_electron_advance || t_params.implicit_electron_ppar) + if (t_params.implicit_electron_advance || t_params.implicit_electron_time_evolving || + t_params.implicit_electron_ppar) advance_electron_energy = true advance_electron_conduction = true end + if t_params.implicit_electron_time_evolving + advance_electron_pdf = true + end manufactured_solns_test = manufactured_solns_input.use_for_advance @@ -1476,11 +1515,12 @@ function setup_implicit_advance_flags(moments, composition, t_params, collisions advance_external_source, advance_ion_numerical_dissipation, advance_neutral_numerical_dissipation, advance_sources, advance_continuity, advance_force_balance, advance_energy, - advance_electron_energy, advance_electron_conduction, - advance_neutral_external_source, advance_neutral_sources, - advance_neutral_continuity, advance_neutral_force_balance, - advance_neutral_energy, manufactured_solns_test, r_diffusion, - vpa_diffusion, vperp_diffusion, vz_diffusion) + advance_electron_pdf, advance_electron_energy, + advance_electron_conduction, advance_neutral_external_source, + advance_neutral_sources, advance_neutral_continuity, + advance_neutral_force_balance, advance_neutral_energy, + manufactured_solns_test, r_diffusion, vpa_diffusion, + vperp_diffusion, vz_diffusion) end function setup_dummy_and_buffer_arrays(nr, nz, nvpa, nvperp, nvz, nvr, nvzeta, @@ -1681,7 +1721,7 @@ end create an array of structs containing scratch arrays for the normalised pdf and low-order moments that may be evolved separately via fluid equations """ -function setup_scratch_arrays(moments, pdf, n) +function setup_scratch_arrays(moments, pdf, n, time_evolve_electrons) # will create n structs, each of which will contain one pdf, # density, parallel flow, parallel pressure, and perpendicular pressure array for ions # (possibly) the same for electrons, and the same for neutrals. The actual array will @@ -1690,6 +1730,12 @@ function setup_scratch_arrays(moments, pdf, n) scratch = Vector{scratch_pdf}(undef, n) pdf_dims = size(pdf.ion.norm) moment_dims = size(moments.ion.dens) + + if time_evolve_electrons + pdf_electron_dims = size(pdf.electron.norm) + else + pdf_electron_dims = (0,0,0,0) + end moment_electron_dims = size(moments.electron.dens) pdf_neutral_dims = size(pdf.neutral.norm) @@ -1705,6 +1751,7 @@ function setup_scratch_arrays(moments, pdf, n) pperp_array = allocate_shared_float(moment_dims...) temp_array = allocate_shared_float(moment_dims...) + pdf_electron_array = allocate_shared_float(pdf_electron_dims...) density_electron_array = allocate_shared_float(moment_electron_dims...) upar_electron_array = allocate_shared_float(moment_electron_dims...) ppar_electron_array = allocate_shared_float(moment_electron_dims...) @@ -1719,11 +1766,11 @@ function setup_scratch_arrays(moments, pdf, n) scratch[istage] = scratch_pdf(pdf_array, density_array, upar_array, ppar_array, pperp_array, temp_array, - density_electron_array, upar_electron_array, - ppar_electron_array, pperp_electron_array, - temp_electron_array, pdf_neutral_array, - density_neutral_array, uz_neutral_array, - pz_neutral_array) + pdf_electron_array, density_electron_array, + upar_electron_array, ppar_electron_array, + pperp_electron_array, temp_electron_array, + pdf_neutral_array, density_neutral_array, + uz_neutral_array, pz_neutral_array) @serial_region begin scratch[istage].pdf .= pdf.ion.norm scratch[istage].density .= moments.ion.dens @@ -1731,6 +1778,9 @@ function setup_scratch_arrays(moments, pdf, n) scratch[istage].ppar .= moments.ion.ppar scratch[istage].pperp .= moments.ion.pperp + if time_evolve_electrons + scratch[istage].pdf_electron .= pdf.electron.norm + end scratch[istage].electron_density .= moments.electron.dens scratch[istage].electron_upar .= moments.electron.upar scratch[istage].electron_ppar .= moments.electron.ppar @@ -2423,6 +2473,19 @@ moments and moment derivatives moments, vpa) end end + + if (composition.electron_physics ∈ (kinetic_electrons, + kinetic_electrons_with_temperature_equation) + && length(this_scratch.pdf_electron) > 0) + + for ir ∈ 1:r.n + @views apply_electron_bc_and_constraints_no_r!( + this_scratch.pdf_electron[:,:,:,ir], fields.phi[:,ir], moments, + r, z, vperp, vpa, vperp_spectral, vpa_spectral, + electron_vpa_advect, num_diss_params, composition, ir, + nl_solver_params.electron_advance) + end + end end # update remaining velocity moments that are calculable from the evolved pdf @@ -2654,6 +2717,10 @@ appropriate. begin_s_r_z_region() rk_loworder_solution!(scratch, scratch_implicit, :ppar, t_params) end + if t_params.implicit_electron_time_evolving + begin_r_z_vperp_vpa_region() + rk_loworder_solution!(scratch, scratch_implicit, :pdf_electron, t_params) + end if composition.electron_physics ∈ (braginskii_fluid, kinetic_electrons, kinetic_electrons_with_temperature_equation) begin_r_z_region() @@ -2685,6 +2752,7 @@ appropriate. scratch[t_params.n_rk_stages+1].ppar, scratch[t_params.n_rk_stages+1].pperp, scratch[t_params.n_rk_stages+1].temp_z_s, + scratch[2].pdf_electron, scratch[t_params.n_rk_stages+1].electron_density, scratch[t_params.n_rk_stages+1].electron_upar, scratch[t_params.n_rk_stages+1].electron_ppar, @@ -3018,6 +3086,12 @@ end first_scratch.pperp[iz,ir,is] = moments.ion.pperp[iz,ir,is] end + if length(first_scratch.pdf_electron) > 0 + begin_r_z_vperp_vpa_region() + @loop_r_z_vperp_vpa ir iz ivperp ivpa begin + first_scratch.pdf_electron[ivpa,ivperp,iz,ir] = pdf.electron.norm[ivpa,ivperp,iz,ir] + end + end begin_r_z_region() @loop_r_z ir iz begin first_scratch.electron_density[iz,ir] = moments.electron.dens[iz,ir] @@ -3100,7 +3174,9 @@ end # The result of the implicit solve gives the state vector at 'istage' # which is used as input to the explicit part of the IMEX time step. old_scratch = scratch_implicit[istage] - update_electrons = !(t_params.implicit_electron_advance || t_params.implicit_electron_ppar) + update_electrons = !(t_params.implicit_electron_advance || + t_params.implicit_electron_time_evolving || + t_params.implicit_electron_ppar) bcs_constraints_success = apply_all_bcs_constraints_update_moments!( scratch_implicit[istage], pdf, moments, fields, boundary_distributions, scratch_electron, vz, vr, vzeta, vpa, vperp, @@ -3149,7 +3225,9 @@ end || (istage == n_rk_stages && t_params.implicit_coefficient_is_zero[1]) || t_params.implicit_coefficient_is_zero[istage+1]) update_electrons = (t_params.rk_coefs_implicit === nothing - || !(t_params.implicit_electron_advance || t_params.implicit_electron_ppar)) + || !(t_params.implicit_electron_advance || + t_params.implicit_electron_time_evolving || + t_params.implicit_electron_ppar)) diagnostic_moments = diagnostic_checks && istage == n_rk_stages bcs_constraints_success = apply_all_bcs_constraints_update_moments!( scratch[istage+1], pdf, moments, fields, boundary_distributions, @@ -3172,7 +3250,7 @@ end if t_params.adaptive nl_max_its_fraction = 0.0 - if t_params.implicit_electron_advance + if t_params.implicit_electron_advance || t_params.implicit_electron_time_evolving params_to_check = (nl_solver_params.ion_advance, nl_solver_params.vpa_advection, nl_solver_params.electron_conduction, @@ -3221,6 +3299,9 @@ end t_params.electron.max_step_count_this_ion_step[] = 0 t_params.electron.max_t_increment_this_ion_step[] = 0.0 end + if t_params.implicit_electron_time_evolving + reset_nonlinear_per_stage_counters!(nl_solver_params.electron_advance) + end if t_params.previous_dt[] > 0.0 @@ -3240,6 +3321,12 @@ end end # No need to synchronize here as we only change electron quantities and previous # region only changed ion quantities. + if length(final_scratch.pdf_electron) > 0 + begin_r_z_vperp_vpa_region() + @loop_r_z_vperp_vpa ir iz ivperp ivpa begin + pdf.electron.norm[ivpa,ivperp,iz,ir] = final_scratch.pdf_electron[ivpa,ivperp,iz,ir] + end + end begin_r_z_region(no_synchronize=true) @loop_r_z ir iz begin moments.electron.dens[iz,ir] = final_scratch.electron_density[iz,ir] @@ -3552,6 +3639,18 @@ with fvec_in an input and fvec_out the output z_spectral, composition, external_source_settings.neutral, num_diss_params) end + + if advance.electron_pdf + electron_t_params = (dt=Ref(dt),) + for ir ∈ 1:r.n + @views electron_kinetic_equation_euler_update!( + fvec_out.pdf_electron[:,:,:,ir], fvec_out.electron_ppar[:,ir], + fvec_in.pdf_electron[:,:,:,ir], fvec_in.electron_ppar[:,ir], + moments, z, vperp, vpa, z_spectral, vpa_spectral, z_advect, + vpa_advect, scratch_dummy, collisions, composition, + external_source_settings, num_diss_params, electron_t_params, ir) + end + end if advance.electron_energy electron_energy_equation!(fvec_out.electron_ppar, fvec_in.electron_ppar, fvec_in.density, fvec_in.electron_upar, fvec_in.density, @@ -3607,6 +3706,17 @@ end nl_solver_params.electron_advance) success = success && (electron_success == "") + elseif t_params.implicit_electron_time_evolving + t_params.electron.dt[] = dt + for ir ∈ 1:r.n + electron_success = electron_backward_euler!( + fvec_in, fvec_out, moments, fields.phi, collisions, composition, r, + z, vperp, vpa, z_spectral, vperp_spectral, vpa_spectral, z_advect, + vpa_advect, scratch_dummy, t_params.electron, + external_source_settings, num_diss_params, + nl_solver_params.electron_advance, ir; evolve_ppar=true) + success = success && electron_success + end elseif t_params.implicit_electron_ppar max_electron_pdf_iterations = t_params.electron.max_pseudotimesteps max_electron_sim_time = t_params.electron.max_pseudotime @@ -3938,6 +4048,12 @@ function update_solution_vector!(new_evolved, old_evolved, moments, composition, new_evolved.upar[iz,ir,is] = old_evolved.upar[iz,ir,is] new_evolved.ppar[iz,ir,is] = old_evolved.ppar[iz,ir,is] end + if length(new_evolved.pdf_electron) > 0 + begin_r_z_vperp_vpa_region() + @loop_r_z_vperp_vpa ir iz ivperp ivpa begin + new_evolved.pdf_electron[ivpa,ivperp,iz,ir] = old_evolved.pdf_electron[ivpa,ivperp,iz,ir] + end + end begin_r_z_region() @loop_r_z ir iz begin new_evolved.electron_density[iz,ir] = old_evolved.electron_density[iz,ir] diff --git a/util/precompile_run.jl b/util/precompile_run.jl index a1e3e58ad..d66c9e8e4 100644 --- a/util/precompile_run.jl +++ b/util/precompile_run.jl @@ -111,6 +111,7 @@ kinetic_electron_input = recursive_merge(cheb_input, OptionsDict("evolve_moments "vr" => OptionsDict("ngrid" => 1, "nelement" => 1), "composition" => OptionsDict("electron_physics" => "kinetic_electrons"), + "timestepping" => OptionsDict("type" => "KennedyCarpenterARK324"), "electron_timestepping" => OptionsDict("nstep" => 1, "dt" => 2.0e-11, "initialization_residual_value" => 1.0e10, diff --git a/util/precompile_run_kinetic-electrons.jl b/util/precompile_run_kinetic-electrons.jl index fd3e54ca7..d1b67459e 100644 --- a/util/precompile_run_kinetic-electrons.jl +++ b/util/precompile_run_kinetic-electrons.jl @@ -48,7 +48,8 @@ input = OptionsDict("output" => OptionsDict("run_name" => "precompilation", "bc" => "zero", "L" => 8.0, "discretization" => "gausslegendre_pseudospectral"), - "timestepping" => OptionsDict("nstep" => 1, + "timestepping" => OptionsDict("type" => "KennedyCarpenterARK324", + "nstep" => 1, "dt" => 2.0e-11), "electron_timestepping" => OptionsDict("nstep" => 1, "dt" => 2.0e-11, From e8e88d8b9c12b34b16f84027015337264c434afb Mon Sep 17 00:00:00 2001 From: John Omotani Date: Sat, 7 Dec 2024 21:16:46 +0000 Subject: [PATCH 06/23] Example input with 'time-evolving' electron shape function --- ...enterARK324-time-evolving-ge-wall-Jac.toml | 165 ++++++++++++++++++ 1 file changed, 165 insertions(+) create mode 100644 examples/kinetic-electrons/wall-bc_recyclefraction0.5_split3_kinetic-coarse_tails-KennedyCarpenterARK324-time-evolving-ge-wall-Jac.toml diff --git a/examples/kinetic-electrons/wall-bc_recyclefraction0.5_split3_kinetic-coarse_tails-KennedyCarpenterARK324-time-evolving-ge-wall-Jac.toml b/examples/kinetic-electrons/wall-bc_recyclefraction0.5_split3_kinetic-coarse_tails-KennedyCarpenterARK324-time-evolving-ge-wall-Jac.toml new file mode 100644 index 000000000..659d2ed28 --- /dev/null +++ b/examples/kinetic-electrons/wall-bc_recyclefraction0.5_split3_kinetic-coarse_tails-KennedyCarpenterARK324-time-evolving-ge-wall-Jac.toml @@ -0,0 +1,165 @@ +[r] +ngrid = 1 +nelement = 1 + +[evolve_moments] +parallel_pressure = true +density = true +moments_conservation = true +parallel_flow = true + +[reactions] +electron_ionization_frequency = 0.0 +ionization_frequency = 0.5 +charge_exchange_frequency = 0.75 + +[vz] +ngrid = 6 +discretization = "gausslegendre_pseudospectral" +nelement = 31 +L = 36.0 +element_spacing_option = "coarse_tails" +bc = "zero" + +[ion_species_1] +initial_temperature = 0.1 +initial_density = 1.0 + +[krook_collisions] +use_krook = true + +[vpa] +ngrid = 6 +discretization = "gausslegendre_pseudospectral" +nelement = 31 +L = 30.0 +element_spacing_option = "coarse_tails" +bc = "zero" + +[z] +ngrid = 5 +discretization = "gausslegendre_pseudospectral" +nelement = 32 +nelement_local = 4 +bc = "wall" +element_spacing_option = "sqrt" + +[vpa_IC_ion_species_1] +initialization_option = "gaussian" +density_amplitude = 1.0 +temperature_amplitude = 0.0 +density_phase = 0.0 +upar_amplitude = 0.0 +temperature_phase = 0.0 +upar_phase = 0.0 + +[z_IC_neutral_species_1] +initialization_option = "gaussian" +temperature_amplitude = 0.0 +density_amplitude = 0.001 +density_phase = 0.0 +upar_amplitude = -1.0 +temperature_phase = 0.0 +upar_phase = 0.0 + +[composition] +T_wall = 0.1 +T_e = 0.2 +electron_physics = "kinetic_electrons" +recycling_fraction = 0.5 +n_ion_species = 1 +n_neutral_species = 1 + +[vz_IC_neutral_species_1] +initialization_option = "gaussian" +density_amplitude = 1.0 +temperature_amplitude = 0.0 +density_phase = 0.0 +upar_amplitude = 0.0 +temperature_phase = 0.0 +upar_phase = 0.0 + +[z_IC_ion_species_1] +initialization_option = "gaussian" +density_amplitude = 0.001 +temperature_amplitude = 0.0 +density_phase = 0.0 +upar_amplitude = 1.0 +temperature_phase = 0.0 +upar_phase = 0.0 + +[neutral_species_1] +initial_temperature = 1.0 +initial_density = 1.0 + +[timestepping] +type = "KennedyCarpenterARK324" +implicit_electron_advance = false +implicit_electron_time_evolving=true +implicit_electron_ppar = false +implicit_ion_advance = false +implicit_vpa_advection = false +nstep = 1000000 +dt = 1.0e-5 +nwrite = 10000 +nwrite_dfns = 10000 +steady_state_residual = true +converged_residual_value = 1.0e-3 + +#write_after_fixed_step_count = true +#nstep = 1 +#nwrite = 1 +#nwrite_dfns = 1 + +[electron_timestepping] +nstep = 5000000 +#nstep = 1 +dt = 1.0e-5 +maximum_dt = 2.0e-5 +nwrite = 10000 +nwrite_dfns = 100000 +#type = "SSPRK4" +type = "Fekete4(3)" +rtol = 1.0e-3 +atol = 1.0e-14 +minimum_dt = 1.0e-9 +decrease_dt_iteration_threshold = 50 +increase_dt_iteration_threshold = 20 +cap_factor_ion_dt = 10.0 +initialization_residual_value = 2.5 +converged_residual_value = 1.0e-2 +include_wall_bc_in_preconditioner = true + +#debug_io = 1 + +[nonlinear_solver] +nonlinear_max_iterations = 100 +rtol = 1.0e-6 #1.0e-8 +atol = 1.0e-14 #1.0e-16 +linear_restart = 5 +preconditioner_update_interval = 25 +total_its_soft_limit = 30 +adi_precon_iterations = 3 + +[ion_source_1] +active = true +z_profile = "gaussian" +z_width = 0.125 +source_strength = 2.0 +source_T = 2.0 + +[ion_numerical_dissipation] +#vpa_dissipation_coefficient = 1.0e-1 +#vpa_dissipation_coefficient = 1.0e-2 +#vpa_dissipation_coefficient = 1.0e-3 +force_minimum_pdf_value = 0.0 + +[electron_numerical_dissipation] +vpa_dissipation_coefficient = 2.0 +force_minimum_pdf_value = 0.0 + +[neutral_numerical_dissipation] +#vz_dissipation_coefficient = 1.0e-1 +#vz_dissipation_coefficient = 1.0e-2 +#vz_dissipation_coefficient = 1.0e-3 +force_minimum_pdf_value = 0.0 From 702f436afda8ef332f94474d48ed9e7fa18680ad Mon Sep 17 00:00:00 2001 From: John Omotani Date: Sun, 8 Dec 2024 10:36:41 +0000 Subject: [PATCH 07/23] Enforce maximum_dt in electron_backward_euler_pseudotimestepping!() --- moment_kinetics/src/electron_kinetic_equation.jl | 2 ++ moment_kinetics/test/kinetic_electron_tests.jl | 1 + 2 files changed, 3 insertions(+) diff --git a/moment_kinetics/src/electron_kinetic_equation.jl b/moment_kinetics/src/electron_kinetic_equation.jl index ebf96ae89..918c40a61 100644 --- a/moment_kinetics/src/electron_kinetic_equation.jl +++ b/moment_kinetics/src/electron_kinetic_equation.jl @@ -883,6 +883,8 @@ function electron_backward_euler_pseudotimestepping!(scratch, pdf, moments, phi, else t_params.dt[] = min(t_params.dt[] * t_params.max_increase_factor, t_params.cap_factor_ion_dt * ion_dt) end + # Ensure dt does not exceed maximum_dt + t_params.dt[] = min(t_params.dt[], t_params.maximum_dt) end first_step = false diff --git a/moment_kinetics/test/kinetic_electron_tests.jl b/moment_kinetics/test/kinetic_electron_tests.jl index 60ef83ae6..9db8db41d 100644 --- a/moment_kinetics/test/kinetic_electron_tests.jl +++ b/moment_kinetics/test/kinetic_electron_tests.jl @@ -117,6 +117,7 @@ kinetic_input["timestepping"] = OptionsDict("type" => "PareschiRusso2(2,2,2)", kinetic_input["electron_timestepping"] = OptionsDict("nstep" => 5000000, "dt" => 2.0e-5, + "maximum_dt" => Inf, "nwrite" => 10000, "nwrite_dfns" => 100000, "decrease_dt_iteration_threshold" => 5000, From 5de9a6480de587348d0fe7db836c142bae9bb4f3 Mon Sep 17 00:00:00 2001 From: John Omotani Date: Sun, 8 Dec 2024 12:15:59 +0000 Subject: [PATCH 08/23] Add adaptive timestep limit for total linear JFNK iterations --- moment_kinetics/src/initial_conditions.jl | 1 + moment_kinetics/src/nonlinear_solvers.jl | 4 +++- moment_kinetics/src/runge_kutta.jl | 12 +++++++----- moment_kinetics/src/time_advance.jl | 12 ++++++++---- 4 files changed, 19 insertions(+), 10 deletions(-) diff --git a/moment_kinetics/src/initial_conditions.jl b/moment_kinetics/src/initial_conditions.jl index 0e7af0346..e5524f296 100644 --- a/moment_kinetics/src/initial_conditions.jl +++ b/moment_kinetics/src/initial_conditions.jl @@ -766,6 +766,7 @@ function initialize_electron_pdf!(scratch, scratch_electron, pdf, moments, field nl_solver_params.electron_advance.serial_solve, nl_solver_params.electron_advance.max_nonlinear_iterations_this_step, nl_solver_params.electron_advance.max_linear_iterations_this_step, + nl_solver_params.electron_advance.total_its_soft_limit, nl_solver_params.electron_advance.preconditioner_type, nl_solver_params.electron_advance.preconditioner_update_interval, nl_solver_params.electron_advance.preconditioners, diff --git a/moment_kinetics/src/nonlinear_solvers.jl b/moment_kinetics/src/nonlinear_solvers.jl index 7ba24ea37..3fc169069 100644 --- a/moment_kinetics/src/nonlinear_solvers.jl +++ b/moment_kinetics/src/nonlinear_solvers.jl @@ -71,6 +71,7 @@ struct nl_solver_info{TH,TV,Tcsg,Tlig,Tprecon,Tpretype} serial_solve::Bool max_nonlinear_iterations_this_step::Base.RefValue{mk_int} max_linear_iterations_this_step::Base.RefValue{mk_int} + total_its_soft_limit::mk_int preconditioner_type::Tpretype preconditioner_update_interval::mk_int preconditioners::Tprecon @@ -98,6 +99,7 @@ function setup_nonlinear_solve(active, input_dict, coords, outer_coords=(); defa linear_restart=10, linear_max_restarts=0, preconditioner_update_interval=300, + total_its_soft_limit=50, adi_precon_iterations=1, ) @@ -278,7 +280,7 @@ function setup_nonlinear_solve(active, input_dict, coords, outer_coords=(); defa Ref(nl_solver_input.preconditioner_update_interval), Ref(mk_float(0.0)), zeros(mk_int, n_vcut_inds), zeros(mk_int, n_vcut_inds), serial_solve, Ref(0), Ref(0), - preconditioner_type, + nl_solver_input.total_its_soft_limit, preconditioner_type, nl_solver_input.preconditioner_update_interval, preconditioners) end diff --git a/moment_kinetics/src/runge_kutta.jl b/moment_kinetics/src/runge_kutta.jl index 772cda8ba..6ea53ba10 100644 --- a/moment_kinetics/src/runge_kutta.jl +++ b/moment_kinetics/src/runge_kutta.jl @@ -1058,15 +1058,17 @@ end """ adaptive_timestep_update_t_params!(t_params, CFL_limits, error_norms, total_points, error_norm_method, success, - nl_max_its_fraction, composition; - electron=false, local_max_dt::mk_float=Inf) + nl_max_its_fraction, nl_total_its_soft_limit, + composition; electron=false, + local_max_dt::mk_float=Inf) Use the calculated `CFL_limits` and `error_norms` to update the timestep in `t_params`. """ function adaptive_timestep_update_t_params!(t_params, CFL_limits, error_norms, total_points, error_norm_method, success, - nl_max_its_fraction, composition; - electron=false, local_max_dt::mk_float=Inf) + nl_max_its_fraction, nl_total_its_soft_limit, + composition; electron=false, + local_max_dt::mk_float=Inf) # Get global minimum of CFL limits CFL_limit = Ref(0.0) this_limit_caused_by = nothing @@ -1325,7 +1327,7 @@ function adaptive_timestep_update_t_params!(t_params, CFL_limits, error_norms, end end - if nl_max_its_fraction > 0.5 && t_params.previous_dt[] > 0.0 + if (nl_max_its_fraction > 0.5 || nl_total_its_soft_limit) && t_params.previous_dt[] > 0.0 # The last step took many nonlinear iterations, so do not allow the # timestep to increase. # If t_params.previous_dt[]==0.0, then the previous step failed so diff --git a/moment_kinetics/src/time_advance.jl b/moment_kinetics/src/time_advance.jl index 97321c142..522c7338b 100644 --- a/moment_kinetics/src/time_advance.jl +++ b/moment_kinetics/src/time_advance.jl @@ -2624,7 +2624,8 @@ end external_source_settings, spectral_objects, advect_objects, gyroavs, num_diss_params, nl_solver_params, advance, scratch_dummy, r, z, vperp, - vpa, vzeta, vr, vz, success, nl_max_its_fraction) + vpa, vzeta, vr, vz, success, nl_max_its_fraction, + nl_total_its_soft_limit) Check the error estimate for the embedded RK method and adjust the timestep if appropriate. @@ -2635,7 +2636,7 @@ appropriate. geometry, external_source_settings, spectral_objects, advect_objects, gyroavs, num_diss_params, nl_solver_params, advance, scratch_dummy, r, z, vperp, vpa, vzeta, vr, vz, success, - nl_max_its_fraction) = begin + nl_max_its_fraction, nl_total_its_soft_limit) = begin #error_norm_method = "Linf" error_norm_method = "L2" @@ -2949,7 +2950,7 @@ appropriate. adaptive_timestep_update_t_params!(t_params, CFL_limits, error_norms, total_points, error_norm_method, success, nl_max_its_fraction, - composition) + nl_total_its_soft_limit, composition) if composition.electron_physics ∈ (kinetic_electrons, kinetic_electrons_with_temperature_equation) @@ -3250,6 +3251,7 @@ end if t_params.adaptive nl_max_its_fraction = 0.0 + nl_total_its_soft_limit = false if t_params.implicit_electron_advance || t_params.implicit_electron_time_evolving params_to_check = (nl_solver_params.ion_advance, nl_solver_params.vpa_advection, @@ -3275,6 +3277,7 @@ end nl_max_its_fraction = max(p.max_nonlinear_iterations_this_step[] / p.nonlinear_max_iterations, nl_max_its_fraction) + nl_total_its_soft_limit = p.max_linear_iterations_this_step[] > p.total_its_soft_limit || nl_total_its_soft_limit end end adaptive_timestep_update!(scratch, scratch_implicit, scratch_electron, @@ -3283,7 +3286,8 @@ end geometry, external_source_settings, spectral_objects, advect_objects, gyroavs, num_diss_params, nl_solver_params, advance, scratch_dummy, r, z, vperp, - vpa, vzeta, vr, vz, success, nl_max_its_fraction) + vpa, vzeta, vr, vz, success, nl_max_its_fraction, + nl_total_its_soft_limit) elseif success != "" error("Implicit part of timestep failed") end From f17a8c4463a2aa0c48ebf76520815e3ad67712f1 Mon Sep 17 00:00:00 2001 From: John Omotani Date: Sun, 8 Dec 2024 13:06:53 +0000 Subject: [PATCH 09/23] Fix writing of 'dt' when 'stopnow' is used When the 'stopnow' file is created to immediately stop a run, `t_params.dt_before_output[]` was previously not set, because the `adaptive_timestep_update_t_params!()` function does not know that there is going to be an output triggered by 'stopnow', so 'dt' was written incorrectly. Fix this by setting `t_params.dt_before_output[] = t_params.dt[]` when 'stopnow' is found. --- moment_kinetics/src/time_advance.jl | 1 + 1 file changed, 1 insertion(+) diff --git a/moment_kinetics/src/time_advance.jl b/moment_kinetics/src/time_advance.jl index 522c7338b..76c14eda3 100644 --- a/moment_kinetics/src/time_advance.jl +++ b/moment_kinetics/src/time_advance.jl @@ -1928,6 +1928,7 @@ function time_advance!(pdf, scratch, scratch_implicit, scratch_electron, t_para # Stop cleanly if a file called 'stop' was created println("Found 'stopnow' file $(t_params.stopfile * "now"), aborting run") finish_now = true + t_params.dt_before_output[] = t_params.dt[] end if t_params.adaptive && !t_params.write_after_fixed_step_count From ae144d20e380b83f8918ed119f5be32d673b54f9 Mon Sep 17 00:00:00 2001 From: John Omotani Date: Mon, 9 Dec 2024 13:49:33 +0000 Subject: [PATCH 10/23] Comment out line search in Newton iteration The line search seems to just slow down simulations, not make them more robust (which was the hope). It is probably better to just fail faster and decrease the timestep, etc. --- moment_kinetics/src/nonlinear_solvers.jl | 75 ++++++++++++------------ 1 file changed, 38 insertions(+), 37 deletions(-) diff --git a/moment_kinetics/src/nonlinear_solvers.jl b/moment_kinetics/src/nonlinear_solvers.jl index 3fc169069..361547970 100644 --- a/moment_kinetics/src/nonlinear_solvers.jl +++ b/moment_kinetics/src/nonlinear_solvers.jl @@ -478,43 +478,44 @@ old_precon_iterations = nl_solver_params.precon_iterations[] if isnan(residual_norm) error("NaN in Newton iteration at iteration $counter") end - if residual_norm > previous_residual_norm - # Do a line search between x and x+delta_x to try to find an update that does - # decrease residual_norm - s = 0.5 - while s > 1.0e-2 - parallel_map(solver_type, (x,delta_x,s) -> x + s * delta_x, w, x, delta_x, s) - residual_func!(residual, x) - residual_norm = distributed_norm(solver_type, residual, norm_params...) - if residual_norm ≤ previous_residual_norm - break - end - s *= 0.5 - end - - #if residual_norm > previous_residual_norm - # # Failed to find a point that decreases the residual, so try a negative - # # step - # s = -1.0e-5 - # parallel_map(solver_type, (x,delta_x,s) -> x + s * delta_x, w, x, delta_x, s) - # residual_func!(residual, x) - # residual_norm = distributed_norm(solver_type, residual, norm_params...) - # if residual_norm > previous_residual_norm - # # That didn't work either, so just take the full step and hope for - # # convergence later - # parallel_map(solver_type, (x,delta_x,s) -> x + s * delta_x, w, x, delta_x, s) - # residual_func!(residual, x) - # residual_norm = distributed_norm(solver_type, residual, norm_params...) - # end - #end - if residual_norm > previous_residual_norm - # Line search didn't work, so just take the full step and hope for - # convergence later - parallel_map(solver_type, (x,delta_x,s) -> x + s * delta_x, w, x, delta_x, s) - residual_func!(residual, x) - residual_norm = distributed_norm(solver_type, residual, norm_params...) - end - end +# if residual_norm > previous_residual_norm +# # Do a line search between x and x+delta_x to try to find an update that does +# # decrease residual_norm +# s = 0.5 +# while s > 1.0e-2 +# parallel_map(solver_type, (x,delta_x,s) -> x + s * delta_x, w, x, delta_x, s) +# residual_func!(residual, x) +# residual_norm = distributed_norm(solver_type, residual, norm_params...) +# if residual_norm ≤ previous_residual_norm +# break +# end +# s *= 0.5 +# end +# println("line search s ", s) +# +# #if residual_norm > previous_residual_norm +# # # Failed to find a point that decreases the residual, so try a negative +# # # step +# # s = -1.0e-5 +# # parallel_map(solver_type, (x,delta_x,s) -> x + s * delta_x, w, x, delta_x, s) +# # residual_func!(residual, x) +# # residual_norm = distributed_norm(solver_type, residual, norm_params...) +# # if residual_norm > previous_residual_norm +# # # That didn't work either, so just take the full step and hope for +# # # convergence later +# # parallel_map(solver_type, (x,delta_x,s) -> x + s * delta_x, w, x, delta_x, s) +# # residual_func!(residual, x) +# # residual_norm = distributed_norm(solver_type, residual, norm_params...) +# # end +# #end +# if residual_norm > previous_residual_norm +# # Line search didn't work, so just take the full step and hope for +# # convergence later +# parallel_map(solver_type, (x,delta_x,s) -> x + s * delta_x, w, x, delta_x, s) +# residual_func!(residual, x) +# residual_norm = distributed_norm(solver_type, residual, norm_params...) +# end +# end parallel_map(solver_type, (w) -> w, x, w) previous_residual_norm = residual_norm From afdf039d6c026108bb9415d6551ad6d5cb39b472 Mon Sep 17 00:00:00 2001 From: John Omotani Date: Tue, 10 Dec 2024 13:02:35 +0000 Subject: [PATCH 11/23] Better interface for loading from `electron_debug` files Give a kwarg, like for `initial_electron`, rather than having to pass the full file path. --- .../src/makie_post_processing.jl | 10 +++++----- moment_kinetics/src/load_data.jl | 20 +++++++++---------- 2 files changed, 15 insertions(+), 15 deletions(-) diff --git a/makie_post_processing/makie_post_processing/src/makie_post_processing.jl b/makie_post_processing/makie_post_processing/src/makie_post_processing.jl index 78ea8b827..b4fcb76b8 100644 --- a/makie_post_processing/makie_post_processing/src/makie_post_processing.jl +++ b/makie_post_processing/makie_post_processing/src/makie_post_processing.jl @@ -847,11 +847,11 @@ end """ get_run_info(run_dir...; itime_min=1, itime_max=0, - itime_skip=1, dfns=false, initial_electron=false, do_setup=true, - setup_input_file=nothing) + itime_skip=1, dfns=false, initial_electron=false, electron_debug=false, + do_setup=true, setup_input_file=nothing) get_run_info((run_dir, restart_index)...; itime_min=1, itime_max=0, - itime_skip=1, dfns=false, initial_electron=false, do_setup=true, - setup_input_file=nothing) + itime_skip=1, dfns=false, initial_electron=false, electron_debug=false, + do_setup=true, setup_input_file=nothing) Get file handles and other info for a single run @@ -874,7 +874,7 @@ mix Strings and Tuples in a call). By default load data from moments files, pass `dfns=true` to load from distribution functions files, or `initial_electron=true` and `dfns=true` to load from initial electron -state files. +state files, or `electron_debug=true` and `dfns=true` to load from electron debug files. The `itime_min`, `itime_max` and `itime_skip` options can be used to select only a slice of time points when loading data. In `makie_post_process` these options are read from the diff --git a/moment_kinetics/src/load_data.jl b/moment_kinetics/src/load_data.jl index b5150c675..67abc3ba7 100644 --- a/moment_kinetics/src/load_data.jl +++ b/moment_kinetics/src/load_data.jl @@ -3349,7 +3349,7 @@ mix Strings and Tuples in a call). By default load data from moments files, pass `dfns=true` to load from distribution functions files, or `initial_electron=true` and `dfns=true` to load from initial electron -state files. +state files, or `electron_debug=true` and `dfns=true` to load from electron debug files. The `itime_min`, `itime_max` and `itime_skip` options can be used to select only a slice of time points when loading data. In `makie_post_process` these options are read from the @@ -3361,18 +3361,22 @@ values are used as offsets from the final time index of the run. """ function get_run_info_no_setup(run_dir::Union{AbstractString,Tuple{AbstractString,Union{Int,Nothing}}}...; itime_min=1, itime_max=0, itime_skip=1, dfns=false, - initial_electron=false) + initial_electron=false, electron_debug=false) if length(run_dir) == 0 error("No run_dir passed") end if initial_electron && !dfns error("When `initial_electron=true` is passed, `dfns=true` must also be passed") end + if electron_debug && !dfns + error("When `electron_debug=true` is passed, `dfns=true` must also be passed") + end if length(run_dir) > 1 run_info = Tuple(get_run_info_no_setup(r; itime_min=itime_min, itime_max=itime_max, itime_skip=itime_skip, dfns=dfns, - initial_electron=initial_electron) + initial_electron=initial_electron, + electron_debug=electron_debug) for r ∈ run_dir) return run_info end @@ -3393,7 +3397,6 @@ function get_run_info_no_setup(run_dir::Union{AbstractString,Tuple{AbstractStrin * "`(String, Nothing)`. Got $run_dir") end - electron_debug = false if isfile(this_run_dir) # this_run_dir is actually a filename. Assume it is a moment_kinetics output file # and infer the directory and the run_name from the filename. @@ -3409,7 +3412,6 @@ function get_run_info_no_setup(run_dir::Union{AbstractString,Tuple{AbstractStrin run_name = split(filename, ".initial_electron.")[1] elseif occursin(".electron_debug.", filename) run_name = split(filename, ".electron_debug.")[1] - electron_debug = true else error("Cannot recognise '$this_run_dir/$filename' as a moment_kinetics output file") end @@ -3471,11 +3473,9 @@ function get_run_info_no_setup(run_dir::Union{AbstractString,Tuple{AbstractStrin end if initial_electron - if electron_debug - ext = "electron_debug" - else - ext = "initial_electron" - end + ext = "initial_electron" + elseif electron_debug + ext = "electron_debug" elseif dfns ext = "dfns" else From 2f0eb67ed83a1db915c70c4ef67c9079b119f095 Mon Sep 17 00:00:00 2001 From: John Omotani Date: Wed, 11 Dec 2024 20:54:54 +0000 Subject: [PATCH 12/23] Impose maxima on initial electron dt --- moment_kinetics/src/time_advance.jl | 9 +++++++++ 1 file changed, 9 insertions(+) diff --git a/moment_kinetics/src/time_advance.jl b/moment_kinetics/src/time_advance.jl index 76c14eda3..e1f1d3fce 100644 --- a/moment_kinetics/src/time_advance.jl +++ b/moment_kinetics/src/time_advance.jl @@ -517,6 +517,15 @@ function setup_time_info(t_input, n_variables, code_time, dt_reload, max_pseudotime = Inf include_wall_bc_in_preconditioner = false electron_t_params = electron + + # Check maximum dt for electrons + if rk_coefs_implicit !== nothing + electron.dt[] = min(electron.dt[], electron.maximum_dt, + electron.cap_factor_ion_dt * dt[] * rk_coefs_implicit[1,1]) + else + electron.dt[] = min(electron.dt[], electron.maximum_dt) + end + electron.previous_dt[] = electron.dt[] end return time_info(n_variables, t_input["nstep"], end_time, t, dt, previous_dt, dt_before_output, dt_before_last_fail, mk_float(CFL_prefactor), From c8328faab85e4079966f7c2d739f65f710d159d9 Mon Sep 17 00:00:00 2001 From: John Omotani Date: Fri, 13 Dec 2024 17:32:21 +0000 Subject: [PATCH 13/23] Fix selection of time slices used for animation titles --- .../src/makie_post_processing.jl | 30 ++++++++++++++----- 1 file changed, 22 insertions(+), 8 deletions(-) diff --git a/makie_post_processing/makie_post_processing/src/makie_post_processing.jl b/makie_post_processing/makie_post_processing/src/makie_post_processing.jl index b4fcb76b8..b09bc184d 100644 --- a/makie_post_processing/makie_post_processing/src/makie_post_processing.jl +++ b/makie_post_processing/makie_post_processing/src/makie_post_processing.jl @@ -1945,11 +1945,11 @@ for dim ∈ one_dimension_combinations_no_t all(isapprox.(ri.time, run_info[1].time)) for ri ∈ run_info[2:end]) # All times are the same - time = select_slice(run_info[1].time, :t; input=input, it=it) + time = select_time_slice(run_info[1].time, it) title = lift(i->string("t = ", time[i]), frame_index) else title = lift(i->join((string("t", irun, " = ", - select_slice(ri.time, :t; input=input, it=it)[i]) + select_time_slice(ri.time, it)[i]) for (irun,ri) ∈ enumerate(run_info)), "; "), frame_index) end @@ -2038,7 +2038,7 @@ for dim ∈ one_dimension_combinations_no_t ind = frame_index end if ax === nothing - time = select_slice(run_info.time, :t; input=input, it=it) + time = select_time_slice(run_info.time, it) title = lift(i->string("t = ", time[i]), ind) fig, ax = get_1d_ax(; xlabel="$($dim_str)", ylabel=get_variable_symbol(var_name), @@ -2188,13 +2188,13 @@ for (dim1, dim2) ∈ two_dimension_combinations_no_t if length(run_info) > 1 title = get_variable_symbol(var_name) subtitles = (lift(i->string(ri.run_name, "\nt = ", - select_slice(ri.time, :t; input=input, it=it)[i]), + select_time_slice(ri.time, it)[i]), frame_index) for ri ∈ run_info) else - time = select_slice(run_info[1].time, :t; input=input, it=it) + time = select_time_slice(run_info[1].time, it) title = lift(i->string(get_variable_symbol(var_name), "\nt = ", - run_info[1].time[i]), + time[i]), frame_index) subtitles = nothing end @@ -2276,9 +2276,9 @@ for (dim1, dim2) ∈ two_dimension_combinations_no_t colormap = input.colormap end if title === nothing && ax == nothing - time = select_slice(run_info.time, :t; input=input, it=it) + time = select_time_slice(run_info.time, it) title = lift(i->string(get_variable_symbol(var_name), "\nt = ", - run_info.time[i]), + time[i]), ind) end @@ -3514,6 +3514,20 @@ function select_slice(variable::AbstractArray{T,7}, dims::Symbol...; input=nothi return slice end +""" + select_time_slice(time::AbstractVector, range) + +Variant of `select_slice()` to be used on 'time' arrays, which are always 1D. +""" +function select_time_slice(time::AbstractVector, range) + if range === nothing + return time + else + return @view time[range] + end +end + + """ get_dimension_slice_indices(keep_dims...; input, it=nothing, is=nothing, ir=nothing, iz=nothing, ivperp=nothing, ivpa=nothing, From 825b1eb0e208b253faec9254ee20ce2ad3646164 Mon Sep 17 00:00:00 2001 From: John Omotani Date: Fri, 13 Dec 2024 17:33:27 +0000 Subject: [PATCH 14/23] Put legends below plots, and ensure they do not squash the plots --- .../src/makie_post_processing.jl | 230 +++++++++++++++--- 1 file changed, 197 insertions(+), 33 deletions(-) diff --git a/makie_post_processing/makie_post_processing/src/makie_post_processing.jl b/makie_post_processing/makie_post_processing/src/makie_post_processing.jl index b09bc184d..4f4dcbcc9 100644 --- a/makie_post_processing/makie_post_processing/src/makie_post_processing.jl +++ b/makie_post_processing/makie_post_processing/src/makie_post_processing.jl @@ -1528,7 +1528,11 @@ for dim ∈ one_dimension_combinations end if n_runs > 1 - put_legend_above(fig, ax) + put_legend_below(fig, ax) + # Ensure the first row width is 3/4 of the column width so that + # the plot does not get squashed by the legend + rowsize!(fig.layout, 1, Aspect(1, 3/4)) + resize_to_layout!(fig) end if outfile !== nothing @@ -1975,7 +1979,11 @@ for dim ∈ one_dimension_combinations_no_t end if n_runs > 1 - put_legend_above(fig, ax) + put_legend_below(fig, ax) + # Ensure the first row width is 3/4 of the column width so that + # the plot does not get squashed by the legend + rowsize!(fig.layout, 1, Aspect(1, 3/4)) + resize_to_layout!(fig) end if it === nothing @@ -3903,7 +3911,11 @@ function plot_f_unnorm_vs_vpa(run_info::Tuple; f_over_vpa2=false, electron=false end if n_runs > 1 - put_legend_above(fig, ax) + put_legend_below(fig, ax) + # Ensure the first row width is 3/4 of the column width so that + # the plot does not get squashed by the legend + rowsize!(fig.layout, 1, Aspect(1, 3/4)) + resize_to_layout!(fig) end if outfile !== nothing @@ -4265,7 +4277,11 @@ function animate_f_unnorm_vs_vpa(run_info::Tuple; f_over_vpa2=false, electron=fa end if n_runs > 1 - put_legend_above(fig, ax) + put_legend_below(fig, ax) + # Ensure the first row width is 3/4 of the column width so that + # the plot does not get squashed by the legend + rowsize!(fig.layout, 1, Aspect(1, 3/4)) + resize_to_layout!(fig) end if outfile !== nothing @@ -4698,7 +4714,11 @@ function plot_charged_pdf_2D_at_wall(run_info; plot_prefix, electron=false) label="$(run_label)iz=$iz", ax=ax) end end - put_legend_right(fig, ax) + put_legend_below(fig, ax) + # Ensure the first row width is 3/4 of the column width so that + # the plot does not get squashed by the legend + rowsize!(fig.layout, 1, Aspect(1, 3/4)) + resize_to_layout!(fig) outfile=plot_prefix * "pdf$(electron_suffix)_$(label)_vs_vpa.pdf" save(outfile, fig) @@ -4715,7 +4735,11 @@ function plot_charged_pdf_2D_at_wall(run_info; plot_prefix, electron=false) transform=(x)->positive_or_nan(x; epsilon=1.e-20)) end end - put_legend_right(fig, ax) + put_legend_below(fig, ax) + # Ensure the first row width is 3/4 of the column width so that + # the plot does not get squashed by the legend + rowsize!(fig.layout, 1, Aspect(1, 3/4)) + resize_to_layout!(fig) outfile=plot_prefix * "logpdf$(electron_suffix)_$(label)_vs_vpa.pdf" save(outfile, fig) @@ -4732,7 +4756,11 @@ function plot_charged_pdf_2D_at_wall(run_info; plot_prefix, electron=false) label="$(run_label)iz=$iz", ax=ax) end end - put_legend_right(fig, ax) + put_legend_below(fig, ax) + # Ensure the first row width is 3/4 of the column width so that + # the plot does not get squashed by the legend + rowsize!(fig.layout, 1, Aspect(1, 3/4)) + resize_to_layout!(fig) outfile=plot_prefix * "pdf_unnorm_$(label)_vs_vpa.pdf" save(outfile, fig) @@ -4749,7 +4777,11 @@ function plot_charged_pdf_2D_at_wall(run_info; plot_prefix, electron=false) transform=(x)->positive_or_nan(x; epsilon=1.e-20)) end end - put_legend_right(fig, ax) + put_legend_below(fig, ax) + # Ensure the first row width is 3/4 of the column width so that + # the plot does not get squashed by the legend + rowsize!(fig.layout, 1, Aspect(1, 3/4)) + resize_to_layout!(fig) outfile=plot_prefix * "logpdf_unnorm_$(label)_vs_vpa.pdf" save(outfile, fig) end @@ -4790,7 +4822,11 @@ function plot_charged_pdf_2D_at_wall(run_info; plot_prefix, electron=false) frame_index=frame_index) end end - put_legend_right(fig, ax) + put_legend_below(fig, ax) + # Ensure the first row width is 3/4 of the column width so that + # the plot does not get squashed by the legend + rowsize!(fig.layout, 1, Aspect(1, 3/4)) + resize_to_layout!(fig) outfile=plot_prefix * "pdf$(electron_suffix)_$(label)_vs_vpa." * input.animation_ext save_animation(fig, frame_index, nt, outfile) @@ -4809,7 +4845,11 @@ function plot_charged_pdf_2D_at_wall(run_info; plot_prefix, electron=false) transform=(x)->positive_or_nan(x; epsilon=1.e-20)) end end - put_legend_right(fig, ax) + put_legend_below(fig, ax) + # Ensure the first row width is 3/4 of the column width so that + # the plot does not get squashed by the legend + rowsize!(fig.layout, 1, Aspect(1, 3/4)) + resize_to_layout!(fig) outfile=plot_prefix * "logpdf$(electron_suffix)_$(label)_vs_vpa." * input.animation_ext save_animation(fig, frame_index, nt, outfile) @@ -4828,7 +4868,11 @@ function plot_charged_pdf_2D_at_wall(run_info; plot_prefix, electron=false) frame_index=frame_index) end end - put_legend_right(fig, ax) + put_legend_below(fig, ax) + # Ensure the first row width is 3/4 of the column width so that + # the plot does not get squashed by the legend + rowsize!(fig.layout, 1, Aspect(1, 3/4)) + resize_to_layout!(fig) outfile=plot_prefix * "pdf_unnorm_$(label)_vs_vpa." * input.animation_ext save_animation(fig, frame_index, nt, outfile) @@ -4847,7 +4891,11 @@ function plot_charged_pdf_2D_at_wall(run_info; plot_prefix, electron=false) transform=(x)->positive_or_nan(x; epsilon=1.e-20)) end end - put_legend_right(fig, ax) + put_legend_below(fig, ax) + # Ensure the first row width is 3/4 of the column width so that + # the plot does not get squashed by the legend + rowsize!(fig.layout, 1, Aspect(1, 3/4)) + resize_to_layout!(fig) outfile=plot_prefix * "logpdf_unnorm_$(label)_vs_vpa." * input.animation_ext save_animation(fig, frame_index, nt, outfile) end @@ -4953,7 +5001,11 @@ function plot_neutral_pdf_2D_at_wall(run_info; plot_prefix) label="$(run_label)iz=$iz", ax=ax) end end - put_legend_right(fig, ax) + put_legend_below(fig, ax) + # Ensure the first row width is 3/4 of the column width so that + # the plot does not get squashed by the legend + rowsize!(fig.layout, 1, Aspect(1, 3/4)) + resize_to_layout!(fig) outfile=plot_prefix * "pdf_neutral_$(label)_vs_vz.pdf" save(outfile, fig) @@ -4970,7 +5022,11 @@ function plot_neutral_pdf_2D_at_wall(run_info; plot_prefix) transform=(x)->positive_or_nan(x; epsilon=1.e-20)) end end - put_legend_right(fig, ax) + put_legend_below(fig, ax) + # Ensure the first row width is 3/4 of the column width so that + # the plot does not get squashed by the legend + rowsize!(fig.layout, 1, Aspect(1, 3/4)) + resize_to_layout!(fig) outfile=plot_prefix * "logpdf_neutral_$(label)_vs_vpa.pdf" save(outfile, fig) @@ -4988,7 +5044,11 @@ function plot_neutral_pdf_2D_at_wall(run_info; plot_prefix) ax=ax) end end - put_legend_right(fig, ax) + put_legend_below(fig, ax) + # Ensure the first row width is 3/4 of the column width so that + # the plot does not get squashed by the legend + rowsize!(fig.layout, 1, Aspect(1, 3/4)) + resize_to_layout!(fig) outfile=plot_prefix * "pdf_neutral_unnorm_$(label)_vs_vpa.pdf" save(outfile, fig) @@ -5006,7 +5066,11 @@ function plot_neutral_pdf_2D_at_wall(run_info; plot_prefix) transform=(x)->positive_or_nan(x; epsilon=1.e-20)) end end - put_legend_right(fig, ax) + put_legend_below(fig, ax) + # Ensure the first row width is 3/4 of the column width so that + # the plot does not get squashed by the legend + rowsize!(fig.layout, 1, Aspect(1, 3/4)) + resize_to_layout!(fig) outfile=plot_prefix * "logpdf_neutral_unnorm_$(label)_vs_vpa.pdf" save(outfile, fig) end @@ -5065,7 +5129,11 @@ function plot_neutral_pdf_2D_at_wall(run_info; plot_prefix) frame_index=frame_index) end end - put_legend_right(fig, ax) + put_legend_below(fig, ax) + # Ensure the first row width is 3/4 of the column width so that + # the plot does not get squashed by the legend + rowsize!(fig.layout, 1, Aspect(1, 3/4)) + resize_to_layout!(fig) outfile=plot_prefix * "pdf_neutral_$(label)_vs_vz." * input.animation_ext save_animation(fig, frame_index, nt, outfile) @@ -5084,7 +5152,11 @@ function plot_neutral_pdf_2D_at_wall(run_info; plot_prefix) transform=(x)->positive_or_nan(x; epsilon=1.e-20)) end end - put_legend_right(fig, ax) + put_legend_below(fig, ax) + # Ensure the first row width is 3/4 of the column width so that + # the plot does not get squashed by the legend + rowsize!(fig.layout, 1, Aspect(1, 3/4)) + resize_to_layout!(fig) outfile=plot_prefix * "logpdf_neutral_$(label)_vs_vz." * input.animation_ext save_animation(fig, frame_index, nt, outfile) @@ -5104,7 +5176,11 @@ function plot_neutral_pdf_2D_at_wall(run_info; plot_prefix) frame_index=frame_index) end end - put_legend_right(fig, ax) + put_legend_below(fig, ax) + # Ensure the first row width is 3/4 of the column width so that + # the plot does not get squashed by the legend + rowsize!(fig.layout, 1, Aspect(1, 3/4)) + resize_to_layout!(fig) outfile=plot_prefix * "pdf_neutral_unnorm_$(label)_vs_vz." * input.animation_ext save_animation(fig, frame_index, nt, outfile) @@ -5123,7 +5199,11 @@ function plot_neutral_pdf_2D_at_wall(run_info; plot_prefix) transform=(x)->positive_or_nan(x; epsilon=1.e-20)) end end - put_legend_right(fig, ax) + put_legend_below(fig, ax) + # Ensure the first row width is 3/4 of the column width so that + # the plot does not get squashed by the legend + rowsize!(fig.layout, 1, Aspect(1, 3/4)) + resize_to_layout!(fig) outfile=plot_prefix * "logpdf_neutral_unnorm_$(label)_vs_vz." * input.animation_ext save_animation(fig, frame_index, nt, outfile) end @@ -5248,7 +5328,11 @@ function constraints_plots(run_info; plot_prefix=plot_prefix) input=input) end end - put_legend_right(fig, ax) + put_legend_below(fig, ax) + # Ensure the first row width is 3/4 of the column width so that + # the plot does not get squashed by the legend + rowsize!(fig.layout, 1, Aspect(1, 3/4)) + resize_to_layout!(fig) save(plot_prefix * "ion_constraints.pdf", fig) end @@ -5292,7 +5376,11 @@ function constraints_plots(run_info; plot_prefix=plot_prefix) input=input) end end - put_legend_right(fig, ax) + put_legend_below(fig, ax) + # Ensure the first row width is 3/4 of the column width so that + # the plot does not get squashed by the legend + rowsize!(fig.layout, 1, Aspect(1, 3/4)) + resize_to_layout!(fig) save(plot_prefix * "neutral_constraints.pdf", fig) end @@ -5325,7 +5413,11 @@ function constraints_plots(run_info; plot_prefix=plot_prefix) # plot_vs_z(ri, varname; label=label, ax=ax, it=it0, ir=ir0, # input=input) # end - # put_legend_right(fig, ax) + # put_legend_below(fig, ax) + # # Ensure the first row width is 3/4 of the column width so that + # # the plot does not get squashed by the legend + # rowsize!(fig.layout, 1, Aspect(1, 3/4)) + # resize_to_layout!(fig) # save(plot_prefix * "electron_constraints.pdf", fig) #end end @@ -5390,7 +5482,11 @@ function constraints_plots(run_info; plot_prefix=plot_prefix) input=input) end end - put_legend_right(fig, ax) + put_legend_below(fig, ax) + # Ensure the first row width is 3/4 of the column width so that + # the plot does not get squashed by the legend + rowsize!(fig.layout, 1, Aspect(1, 3/4)) + resize_to_layout!(fig) ylims!(ax, ymin, ymax) save_animation(fig, frame_index, nt, plot_prefix * "ion_constraints." * input.animation_ext) @@ -5454,7 +5550,11 @@ function constraints_plots(run_info; plot_prefix=plot_prefix) input=input) end end - put_legend_right(fig, ax) + put_legend_below(fig, ax) + # Ensure the first row width is 3/4 of the column width so that + # the plot does not get squashed by the legend + rowsize!(fig.layout, 1, Aspect(1, 3/4)) + resize_to_layout!(fig) ylims!(ax, ymin, ymax) save_animation(fig, frame_index, nt, plot_prefix * "neutral_constraints." * input.animation_ext) @@ -5505,7 +5605,11 @@ function constraints_plots(run_info; plot_prefix=plot_prefix) # animate_vs_z(ri, varname; label=label, data=data, # frame_index=frame_index, ax=ax, ir=ir0, input=input) # end - # put_legend_right(fig, ax) + # put_legend_below(fig, ax) + # # Ensure the first row width is 3/4 of the column width so that + # # the plot does not get squashed by the legend + # rowsize!(fig.layout, 1, Aspect(1, 3/4)) + # resize_to_layout!(fig) # ylims!(ax, ymin, ymax) # save_animation(fig, frame_index, nt, # plot_prefix * "electron_constraints." * input.animation_ext) @@ -5695,12 +5799,20 @@ function Chodura_condition_plots(run_info::Tuple; plot_prefix) fig = figs[1] ax = axes[1][1] put_legend_below(fig, ax) + # Ensure the first row width is 3/4 of the column width so that + # the plot does not get squashed by the legend + rowsize!(fig.layout, 1, Aspect(1, 3/4)) + resize_to_layout!(fig) outfile = string(plot_prefix, "Chodura_ratio_lower_vs_t.pdf") save(outfile, fig) fig = figs[2] ax = axes[1][2] put_legend_below(fig, ax) + # Ensure the first row width is 3/4 of the column width so that + # the plot does not get squashed by the legend + rowsize!(fig.layout, 1, Aspect(1, 3/4)) + resize_to_layout!(fig) outfile = string(plot_prefix, "Chodura_ratio_upper_vs_t.pdf") save(outfile, fig) end @@ -5708,12 +5820,20 @@ function Chodura_condition_plots(run_info::Tuple; plot_prefix) fig = figs[3] ax = axes[1][3] put_legend_below(fig, ax) + # Ensure the first row width is 3/4 of the column width so that + # the plot does not get squashed by the legend + rowsize!(fig.layout, 1, Aspect(1, 3/4)) + resize_to_layout!(fig) outfile = string(plot_prefix, "Chodura_ratio_lower_vs_r.pdf") save(outfile, fig) fig = figs[4] ax = axes[1][4] put_legend_below(fig, ax) + # Ensure the first row width is 3/4 of the column width so that + # the plot does not get squashed by the legend + rowsize!(fig.layout, 1, Aspect(1, 3/4)) + resize_to_layout!(fig) outfile = string(plot_prefix, "Chodura_ratio_upper_vs_r.pdf") save(outfile, fig) end @@ -5731,12 +5851,20 @@ function Chodura_condition_plots(run_info::Tuple; plot_prefix) println("check axes ", axes) ax = axes[1][7] put_legend_below(fig, ax) + # Ensure the first row width is 3/4 of the column width so that + # the plot does not get squashed by the legend + rowsize!(fig.layout, 1, Aspect(1, 3/4)) + resize_to_layout!(fig) outfile = string(plot_prefix, "pdf_unnorm_over_vpa2_wall-_vs_vpa.pdf") save(outfile, fig) fig = figs[8] ax = axes[1][8] put_legend_below(fig, ax) + # Ensure the first row width is 3/4 of the column width so that + # the plot does not get squashed by the legend + rowsize!(fig.layout, 1, Aspect(1, 3/4)) + resize_to_layout!(fig) outfile = string(plot_prefix, "pdf_unnorm_over_vpa2_wall+_vs_vpa.pdf") save(outfile, fig) end @@ -5747,6 +5875,10 @@ function Chodura_condition_plots(run_info::Tuple; plot_prefix) ax = axes[1][9][1] frame_index = axes[1][9][2] put_legend_below(fig, ax) + # Ensure the first row width is 3/4 of the column width so that + # the plot does not get squashed by the legend + rowsize!(fig.layout, 1, Aspect(1, 3/4)) + resize_to_layout!(fig) outfile = string(plot_prefix, "pdf_unnorm_over_vpa2_wall-_vs_vpa." * input.animation_ext) save_animation(fig, frame_index, nt, outfile) @@ -5754,6 +5886,10 @@ function Chodura_condition_plots(run_info::Tuple; plot_prefix) ax = axes[1][10][1] frame_index = axes[1][10][2] put_legend_below(fig, ax) + # Ensure the first row width is 3/4 of the column width so that + # the plot does not get squashed by the legend + rowsize!(fig.layout, 1, Aspect(1, 3/4)) + resize_to_layout!(fig) outfile = string(plot_prefix, "pdf_unnorm_over_vpa2_wall+_vs_vpa." * input.animation_ext) save_animation(fig, frame_index, nt, outfile) end @@ -6038,7 +6174,11 @@ function sound_wave_plots(run_info::Tuple; plot_prefix) end if input.plot - put_legend_right(fig, ax) + put_legend_below(fig, ax) + # Ensure the first row width is 3/4 of the column width so that + # the plot does not get squashed by the legend + rowsize!(fig.layout, 1, Aspect(1, 3/4)) + resize_to_layout!(fig) save(outfile, fig) @@ -6106,7 +6246,11 @@ function sound_wave_plots(run_info; outfile=nothing, ax=nothing, phi=nothing) error("Cannot save figure from this function when `ax` was passed. Please " * "save the figure that contains `ax`") end - put_legend_right(fig, ax) + put_legend_below(fig, ax) + # Ensure the first row width is 3/4 of the column width so that + # the plot does not get squashed by the legend + rowsize!(fig.layout, 1, Aspect(1, 3/4)) + resize_to_layout!(fig) save(outfile, fig) end end @@ -7788,7 +7932,11 @@ function timestep_diagnostics(run_info, run_info_dfns; plot_prefix=nothing, it=n end end - put_legend_right(steps_fig, ax_failures) + put_legend_below(steps_fig, ax_failures) + # Ensure the first row width is 3/4 of the column width so that + # the plot does not get squashed by the legend + rowsize!(steps_fig.layout, 1, Aspect(1, 3/4)) + resize_to_layout!(steps_fig) if plot_prefix !== nothing outfile = plot_prefix * electron_prefix * "timestep_diagnostics.pdf" @@ -7886,7 +8034,11 @@ function timestep_diagnostics(run_info, run_info_dfns; plot_prefix=nothing, it=n end end #ylims!(ax, 0.0, 10.0 * maxval) - put_legend_right(CFL_fig, ax) + put_legend_below(CFL_fig, ax) + # Ensure the first row width is 3/4 of the column width so that + # the plot does not get squashed by the legend + rowsize!(CFL_fig.layout, 1, Aspect(1, 3/4)) + resize_to_layout!(CFL_fig) if plot_prefix !== nothing outfile = plot_prefix * electron_prefix * "CFL_factors.pdf" @@ -8053,7 +8205,11 @@ function timestep_diagnostics(run_info, run_info_dfns; plot_prefix=nothing, it=n end end - put_legend_right(limits_fig, ax) + put_legend_below(limits_fig, ax) + # Ensure the first row width is 3/4 of the column width so that + # the plot does not get squashed by the legend + rowsize!(limits_fig.layout, 1, Aspect(1, 3/4)) + resize_to_layout!(limits_fig) if plot_prefix !== nothing outfile = plot_prefix * electron_prefix * "timestep_limits.pdf" @@ -8102,7 +8258,11 @@ function timestep_diagnostics(run_info, run_info_dfns; plot_prefix=nothing, it=n end if has_nl_solver - put_legend_right(nl_solvers_fig, ax) + put_legend_below(nl_solvers_fig, ax) + # Ensure the first row width is 3/4 of the column width so that + # the plot does not get squashed by the legend + rowsize!(nl_solvers_fig.layout, 1, Aspect(1, 3/4)) + resize_to_layout!(nl_solvers_fig) if plot_prefix !== nothing outfile = plot_prefix * "nonlinear_solver_iterations.pdf" @@ -8143,7 +8303,11 @@ function timestep_diagnostics(run_info, run_info_dfns; plot_prefix=nothing, it=n end if has_electron_solve - put_legend_right(electron_solver_fig, ax) + put_legend_below(electron_solver_fig, ax) + # Ensure the first row width is 3/4 of the column width so that + # the plot does not get squashed by the legend + rowsize!(electron_solver_fig.layout, 1, Aspect(1, 3/4)) + resize_to_layout!(electron_solver_fig) if has_electron_solve outfile = plot_prefix * "electron_steps.pdf" From 3c3049845ff988e88d5c12d78d7a7e63dea89f4e Mon Sep 17 00:00:00 2001 From: John Omotani Date: Fri, 13 Dec 2024 18:13:53 +0000 Subject: [PATCH 15/23] Save local pseudo-time, residual in electron initialisation/debug output --- .../src/electron_kinetic_equation.jl | 30 ++++++++++++++----- moment_kinetics/src/file_io.jl | 20 +++++++++++-- moment_kinetics/src/initial_conditions.jl | 4 +-- 3 files changed, 43 insertions(+), 11 deletions(-) diff --git a/moment_kinetics/src/electron_kinetic_equation.jl b/moment_kinetics/src/electron_kinetic_equation.jl index 918c40a61..ad5f39be2 100644 --- a/moment_kinetics/src/electron_kinetic_equation.jl +++ b/moment_kinetics/src/electron_kinetic_equation.jl @@ -334,12 +334,17 @@ function update_electron_pdf_with_time_advance!(scratch, pdf, moments, phi, coll end end + # Counter for pseudotime just in this pseudotimestepping loop + local_pseudotime = 0.0 + residual_norm = -1.0 + begin_serial_region() t_params.moments_output_counter[] += 1 @serial_region begin if io_electron !== nothing write_electron_state(scratch, moments, t_params, io_electron, - t_params.moments_output_counter[], r, z, vperp, vpa) + t_params.moments_output_counter[], local_pseudotime, 0.0, + r, z, vperp, vpa) end end # evolve (artificially) in time until the residual is less than the tolerance @@ -484,6 +489,7 @@ function update_electron_pdf_with_time_advance!(scratch, pdf, moments, phi, coll # update the time following the pdf update t_params.t[] += t_params.previous_dt[] + local_pseudotime += t_params.previous_dt[] residual = -1.0 if t_params.previous_dt[] > 0.0 @@ -573,7 +579,8 @@ function update_electron_pdf_with_time_advance!(scratch, pdf, moments, phi, coll if io_electron !== nothing t_params.write_moments_output[] = false write_electron_state(scratch, moments, t_params, io_electron, - t_params.moments_output_counter[], r, z, vperp, + t_params.moments_output_counter[], + local_pseudotime, residual_norm, r, z, vperp, vpa) end end @@ -623,7 +630,8 @@ function update_electron_pdf_with_time_advance!(scratch, pdf, moments, phi, coll if io_electron !== nothing && io_electron !== true t_params.moments_output_counter[] += 1 write_electron_state(scratch, moments, t_params, io_electron, - t_params.moments_output_counter[], r, z, vperp, vpa) + t_params.moments_output_counter[], local_pseudotime, + residual_norm, r, z, vperp, vpa) finish_electron_io(io_electron) end end @@ -752,12 +760,17 @@ function electron_backward_euler_pseudotimestepping!(scratch, pdf, moments, phi, initial_step_counter = t_params.step_counter[] t_params.step_counter[] += 1 + # Pseudotime just in this pseudotimestepping loop + local_pseudotime = 0.0 + residual_norm = -1.0 + begin_serial_region() t_params.moments_output_counter[] += 1 @serial_region begin if io_electron !== nothing write_electron_state(scratch, moments, t_params, io_electron, - t_params.moments_output_counter[], r, z, vperp, vpa) + t_params.moments_output_counter[], local_pseudotime, 0.0, + r, z, vperp, vpa) end end electron_pdf_converged = Ref(false) @@ -833,6 +846,7 @@ function electron_backward_euler_pseudotimestepping!(scratch, pdf, moments, phi, #println("Newton its ", nl_solver_params.max_nonlinear_iterations_this_step[], " ", t_params.dt[]) # update the time following the pdf update t_params.t[] += t_params.dt[] + local_pseudotime += t_params.dt[] if first_step && !reduced_by_ion_dt # Adjust t_params.previous_dt[] which gives the initial timestep for @@ -1000,8 +1014,9 @@ function electron_backward_euler_pseudotimestepping!(scratch, pdf, moments, phi, if io_electron !== nothing t_params.write_moments_output[] = false write_electron_state(scratch, moments, t_params, io_electron, - t_params.moments_output_counter[], r, z, vperp, - vpa) + t_params.moments_output_counter[], + local_pseudotime, residual_norm, r, z, + vperp, vpa) end end end @@ -1040,7 +1055,8 @@ function electron_backward_euler_pseudotimestepping!(scratch, pdf, moments, phi, if io_electron !== nothing && io_electron !== true t_params.moments_output_counter[] += 1 write_electron_state(scratch, moments, t_params, io_electron, - t_params.moments_output_counter[], r, z, vperp, vpa) + t_params.moments_output_counter[], local_pseudotime, + residual_norm, r, z, vperp, vpa) finish_electron_io(io_electron) end end diff --git a/moment_kinetics/src/file_io.jl b/moment_kinetics/src/file_io.jl index e64c8c9f9..b946e4ce9 100644 --- a/moment_kinetics/src/file_io.jl +++ b/moment_kinetics/src/file_io.jl @@ -320,8 +320,12 @@ struct io_initial_electron_info{Tfile, Tfe, Tmom, Texte1, Texte2, Texte3, Texte4 electron_constraints_C_coefficient::Tconstr # cumulative number of electron pseudo-timesteps taken electron_step_counter::Telectronint + # local electron pseudo-time + electron_local_pseudotime::Telectrontime # cumulative electron pseudo-time electron_cumulative_pseudotime::Telectrontime + # current residual for the electron pseudo-timestepping loop + electron_residual::Telectrontime # current electron pseudo-timestep size electron_dt::Telectrontime # size of last electron pseudo-timestep before the output was written @@ -533,6 +537,10 @@ function setup_electron_io(io_input, vpa, vperp, z, r, composition, collisions, io_pseudotime = create_dynamic_variable!(dynamic, "time", mk_float; parallel_io=parallel_io, description="pseudotime used for electron initialization") + io_local_pseudotime = create_dynamic_variable!(dynamic, "electron_local_pseudotime", mk_float; parallel_io=parallel_io, + description="pseudotime within a single pseudotimestepping loop") + io_electron_residual = create_dynamic_variable!(dynamic, "electron_residual", mk_float; parallel_io=parallel_io, + description="residual for electron pseudotimestepping loop") io_f_electron = create_dynamic_variable!(dynamic, "f_electron", mk_float, vpa, vperp, z, r; parallel_io=parallel_io, @@ -642,7 +650,9 @@ function reopen_initial_electron_io(file_info) getvar("electron_constraints_B_coefficient"), getvar("electron_constraints_C_coefficient"), getvar("electron_step_counter"), + getvar("electron_local_pseudotime"), getvar("electron_cumulative_pseudotime"), + getvar("electron_residual"), getvar("electron_dt"), getvar("electron_previous_dt"), getvar("electron_failure_counter"), @@ -3386,12 +3396,14 @@ end """ write_electron_state(scratch_electron, moments, t_params, io_initial_electron, - t_idx, r, z, vperp, vpa; pdf_electron_converged=false) + t_idx, local_pseudotime, electron_residual, r, z, vperp, vpa; + pdf_electron_converged=false) Write the electron state to an output file. """ function write_electron_state(scratch_electron, moments, t_params, - io_or_file_info_initial_electron, t_idx, r, z, vperp, vpa; + io_or_file_info_initial_electron, t_idx, local_pseudotime, + electron_residual, r, z, vperp, vpa; pdf_electron_converged=false) @serial_region begin @@ -3410,8 +3422,12 @@ function write_electron_state(scratch_electron, moments, t_params, # add the pseudo-time for this time slice to the hdf5 file append_to_dynamic_var(io_initial_electron.time, t_params.t[], t_idx, parallel_io) + append_to_dynamic_var(io_initial_electron.electron_local_pseudotime, local_pseudotime, + t_idx, parallel_io) append_to_dynamic_var(io_initial_electron.electron_cumulative_pseudotime, t_params.t[], t_idx, parallel_io) + append_to_dynamic_var(io_initial_electron.electron_residual, electron_residual, + t_idx, parallel_io) write_electron_dfns_data_to_binary(nothing, scratch_electron, t_params, io_initial_electron, t_idx, r, z, vperp, vpa) diff --git a/moment_kinetics/src/initial_conditions.jl b/moment_kinetics/src/initial_conditions.jl index e5524f296..59cb15035 100644 --- a/moment_kinetics/src/initial_conditions.jl +++ b/moment_kinetics/src/initial_conditions.jl @@ -807,8 +807,8 @@ function initialize_electron_pdf!(scratch, scratch_electron, pdf, moments, field t_params.electron.moments_output_counter[] += 1 write_electron_state(scratch_electron, moments, t_params.electron, io_initial_electron, - t_params.electron.moments_output_counter[], r, z, vperp, - vpa; pdf_electron_converged=true) + t_params.electron.moments_output_counter[], -1.0, 0.0, r, + z, vperp, vpa; pdf_electron_converged=true) finish_electron_io(io_initial_electron) end From 1457bf0d4eab82fba3b6773c986bfcc6ff9fe923 Mon Sep 17 00:00:00 2001 From: John Omotani Date: Sat, 14 Dec 2024 14:34:05 +0000 Subject: [PATCH 16/23] Make number of extra z-points near wall settable in wall_plots Line plots vs. w_parallel or v_parallel plot curves for some additional points near the wall. This commit allows the number of those points to be set in the input file. --- .../src/makie_post_processing.jl | 11 +++++++---- 1 file changed, 7 insertions(+), 4 deletions(-) diff --git a/makie_post_processing/makie_post_processing/src/makie_post_processing.jl b/makie_post_processing/makie_post_processing/src/makie_post_processing.jl index 4f4dcbcc9..af0450022 100644 --- a/makie_post_processing/makie_post_processing/src/makie_post_processing.jl +++ b/makie_post_processing/makie_post_processing/src/makie_post_processing.jl @@ -723,6 +723,7 @@ function _setup_single_input!(this_input_dict::OrderedDict{String,Any}, advection_velocity=false, colormap=this_input_dict["colormap"], animation_ext=this_input_dict["animation_ext"], + n_points_near_wall=4, ) set_defaults_and_check_section!( @@ -732,6 +733,7 @@ function _setup_single_input!(this_input_dict::OrderedDict{String,Any}, advection_velocity=false, colormap=this_input_dict["colormap"], animation_ext=this_input_dict["animation_ext"], + n_points_near_wall=4, ) set_defaults_and_check_section!( @@ -741,6 +743,7 @@ function _setup_single_input!(this_input_dict::OrderedDict{String,Any}, advection_velocity=false, colormap=this_input_dict["colormap"], animation_ext=this_input_dict["animation_ext"], + n_points_near_wall=4, ) set_defaults_and_check_section!( @@ -4696,8 +4699,8 @@ function plot_charged_pdf_2D_at_wall(run_info; plot_prefix, electron=false) nt = minimum(ri.nt for ri ∈ run_info) - for (z, z_range, label) ∈ ((z_lower, z_lower:z_lower+4, "wall-"), - (z_upper, z_upper-4:z_upper, "wall+")) + for (z, z_range, label) ∈ ((z_lower, z_lower:z_lower+input.n_points_near_wall, "wall-"), + (z_upper, z_upper-input.n_points_near_wall:z_upper, "wall+")) f_input = copy(input_dict_dfns["f"]) f_input["iz0"] = z @@ -4983,8 +4986,8 @@ function plot_neutral_pdf_2D_at_wall(run_info; plot_prefix) for ri ∈ run_info) nt = minimum(ri.nt for ri ∈ run_info) - for (z, z_range, label) ∈ ((z_lower, z_lower:z_lower+4, "wall-"), - (z_upper, z_upper-4:z_upper, "wall+")) + for (z, z_range, label) ∈ ((z_lower, z_lower:z_lower+input.n_points_near_wall, "wall-"), + (z_upper, z_upper-input.n_points_near_wall:z_upper, "wall+")) f_neutral_input = copy(input_dict_dfns["f_neutral"]) f_neutral_input["iz0"] = z From c2d12abd3b1572315d2bf0a95876ab3466fd664a Mon Sep 17 00:00:00 2001 From: John Omotani Date: Sat, 14 Dec 2024 23:37:37 +0000 Subject: [PATCH 17/23] Enable neutral and electron constraints plots The neutral plots were deactivated by a bug. The electron plots were commented out, but can be made now. --- .../src/makie_post_processing.jl | 180 +++++++++--------- 1 file changed, 90 insertions(+), 90 deletions(-) diff --git a/makie_post_processing/makie_post_processing/src/makie_post_processing.jl b/makie_post_processing/makie_post_processing/src/makie_post_processing.jl index af0450022..b3c6d96e9 100644 --- a/makie_post_processing/makie_post_processing/src/makie_post_processing.jl +++ b/makie_post_processing/makie_post_processing/src/makie_post_processing.jl @@ -5340,7 +5340,7 @@ function constraints_plots(run_info; plot_prefix=plot_prefix) end # Neutrals - if any(ri.n_neutral_species > 1 + if any(ri.n_neutral_species > 0 && (ri.evolve_density || ri.evolve_upar || ri.evolve_ppar) for ri ∈ run_info) @@ -5388,41 +5388,41 @@ function constraints_plots(run_info; plot_prefix=plot_prefix) end # Electrons - #if any(ri.composition.electron_physics ∈ (kinetic_electrons, - # kinetic_electrons_with_temperature_equation) - # for ri ∈ run_info) - - # fig, ax = get_1d_ax(; xlabel="z", ylabel="constraint coefficient") - # for ri ∈ run_info - # if length(run_info) > 1 - # prefix = ri.run_name * ", " - # else - # prefix = "" - # end - - # varname = "electron_constraints_A_coefficient" - # label = prefix * "(A-1)" - # data = get_variable(ri, varname; it=it0, ir=ir0) - # data .-= 1.0 - # plot_vs_z(ri, varname; label=label, data=data, ax=ax, input=input) - - # varname = "electron_constraints_B_coefficient" - # label = prefix * "B" - # plot_vs_z(ri, varname; label=label, ax=ax, it=it0, ir=ir0, - # input=input) - - # varname = "electron_constraints_C_coefficient" - # label = prefix * "C" - # plot_vs_z(ri, varname; label=label, ax=ax, it=it0, ir=ir0, - # input=input) - # end - # put_legend_below(fig, ax) - # # Ensure the first row width is 3/4 of the column width so that - # # the plot does not get squashed by the legend - # rowsize!(fig.layout, 1, Aspect(1, 3/4)) - # resize_to_layout!(fig) - # save(plot_prefix * "electron_constraints.pdf", fig) - #end + if any(ri.composition.electron_physics ∈ (kinetic_electrons, + kinetic_electrons_with_temperature_equation) + for ri ∈ run_info) + + fig, ax = get_1d_ax(; xlabel="z", ylabel="constraint coefficient") + for ri ∈ run_info + if length(run_info) > 1 + prefix = ri.run_name * ", " + else + prefix = "" + end + + varname = "electron_constraints_A_coefficient" + label = prefix * "(A-1)" + data = get_variable(ri, varname; it=it0, ir=ir0) + data .-= 1.0 + plot_vs_z(ri, varname; label=label, data=data, ax=ax, input=input) + + varname = "electron_constraints_B_coefficient" + label = prefix * "B" + plot_vs_z(ri, varname; label=label, ax=ax, it=it0, ir=ir0, + input=input) + + varname = "electron_constraints_C_coefficient" + label = prefix * "C" + plot_vs_z(ri, varname; label=label, ax=ax, it=it0, ir=ir0, + input=input) + end + put_legend_below(fig, ax) + # Ensure the first row width is 3/4 of the column width so that + # the plot does not get squashed by the legend + rowsize!(fig.layout, 1, Aspect(1, 3/4)) + resize_to_layout!(fig) + save(plot_prefix * "electron_constraints.pdf", fig) + end end if input.animate @@ -5496,7 +5496,7 @@ function constraints_plots(run_info; plot_prefix=plot_prefix) end # Neutrals - if any(ri.n_neutral_species > 1 + if any(ri.n_neutral_species > 0 && (ri.evolve_density || ri.evolve_upar || ri.evolve_ppar) for ri ∈ run_info) @@ -5564,59 +5564,59 @@ function constraints_plots(run_info; plot_prefix=plot_prefix) end # Electrons - #if any(ri.composition.electron_physics ∈ (kinetic_electrons, - # kinetic_electrons_with_temperature_equation) - # for ri ∈ run_info) - - # frame_index = Observable(1) - # fig, ax = get_1d_ax(; xlabel="z", ylabel="constraint coefficient") - - # # Calculate plot limits manually so we can exclude the first time point, which - # # often has a large value for (A-1) due to the way initialisation is done, - # # which can make the subsequent values hard to see. - # ymin = Inf - # ymax = -Inf - # for ri ∈ run_info - # if length(run_info) > 1 - # prefix = ri.run_name * ", " - # else - # prefix = "" - # end - - # varname = "electron_constraints_A_coefficient" - # label = prefix * "(A-1)" - # data = get_variable(ri, varname; ir=ir0) - # data .-= 1.0 - # ymin = min(ymin, minimum(data[:,2:end])) - # ymax = max(ymax, maximum(data[:,2:end])) - # animate_vs_z(ri, varname; label=label, data=data, - # frame_index=frame_index, ax=ax, input=input) - - # varname = "electron_constraints_B_coefficient" - # label = prefix * "B" - # data = get_variable(ri, varname; ir=ir0) - # ymin = min(ymin, minimum(data[:,2:end])) - # ymax = max(ymax, maximum(data[:,2:end])) - # animate_vs_z(ri, varname; label=label, data=data, - # frame_index=frame_index, ax=ax, ir=ir0, input=input) - - # varname = "electron_constraints_C_coefficient" - # label = prefix * "C" - # data = get_variable(ri, varname; ir=ir0) - # ymin = min(ymin, minimum(data[:,2:end])) - # ymax = max(ymax, maximum(data[:,2:end])) - # animate_vs_z(ri, varname; label=label, data=data, - # frame_index=frame_index, ax=ax, ir=ir0, input=input) - # end - # put_legend_below(fig, ax) - # # Ensure the first row width is 3/4 of the column width so that - # # the plot does not get squashed by the legend - # rowsize!(fig.layout, 1, Aspect(1, 3/4)) - # resize_to_layout!(fig) - # ylims!(ax, ymin, ymax) - # save_animation(fig, frame_index, nt, - # plot_prefix * "electron_constraints." * input.animation_ext) - #end + if any(ri.composition.electron_physics ∈ (kinetic_electrons, + kinetic_electrons_with_temperature_equation) + for ri ∈ run_info) + + frame_index = Observable(1) + fig, ax = get_1d_ax(; xlabel="z", ylabel="constraint coefficient") + + # Calculate plot limits manually so we can exclude the first time point, which + # often has a large value for (A-1) due to the way initialisation is done, + # which can make the subsequent values hard to see. + ymin = Inf + ymax = -Inf + for ri ∈ run_info + if length(run_info) > 1 + prefix = ri.run_name * ", " + else + prefix = "" + end + + varname = "electron_constraints_A_coefficient" + label = prefix * "(A-1)" + data = get_variable(ri, varname; ir=ir0) + data .-= 1.0 + ymin = min(ymin, minimum(data[:,2:end])) + ymax = max(ymax, maximum(data[:,2:end])) + animate_vs_z(ri, varname; label=label, data=data, + frame_index=frame_index, ax=ax, input=input) + + varname = "electron_constraints_B_coefficient" + label = prefix * "B" + data = get_variable(ri, varname; ir=ir0) + ymin = min(ymin, minimum(data[:,2:end])) + ymax = max(ymax, maximum(data[:,2:end])) + animate_vs_z(ri, varname; label=label, data=data, + frame_index=frame_index, ax=ax, ir=ir0, input=input) + + varname = "electron_constraints_C_coefficient" + label = prefix * "C" + data = get_variable(ri, varname; ir=ir0) + ymin = min(ymin, minimum(data[:,2:end])) + ymax = max(ymax, maximum(data[:,2:end])) + animate_vs_z(ri, varname; label=label, data=data, + frame_index=frame_index, ax=ax, ir=ir0, input=input) + end + put_legend_below(fig, ax) + # Ensure the first row width is 3/4 of the column width so that + # the plot does not get squashed by the legend + rowsize!(fig.layout, 1, Aspect(1, 3/4)) + resize_to_layout!(fig) + ylims!(ax, ymin, ymax) + save_animation(fig, frame_index, nt, + plot_prefix * "electron_constraints." * input.animation_ext) + end end catch e return makie_post_processing_error_handler( From c3584f0fed26f9550ab1d0d78d5f8390c84d219f Mon Sep 17 00:00:00 2001 From: John Omotani Date: Sat, 11 Jan 2025 14:34:13 +0000 Subject: [PATCH 18/23] Update electron qpar to be saved in debug output file Update will be done at the beginning of the next timestep, but without this explicit update the saved qpar would be inconsistent with the saved (current) g_e. --- moment_kinetics/src/electron_kinetic_equation.jl | 9 +++++++++ 1 file changed, 9 insertions(+) diff --git a/moment_kinetics/src/electron_kinetic_equation.jl b/moment_kinetics/src/electron_kinetic_equation.jl index ad5f39be2..eba1ba1cc 100644 --- a/moment_kinetics/src/electron_kinetic_equation.jl +++ b/moment_kinetics/src/electron_kinetic_equation.jl @@ -1008,6 +1008,15 @@ function electron_backward_euler_pseudotimestepping!(scratch, pdf, moments, phi, # For now can only do I/O within the pseudo-timestepping loop when there # is no r-dimension, because different points in r would take different # number and length of timesteps to converge. + + # Update the electron heat flux for output. This will be done anyway + # before using qpar in the next residual_func!() call, but there is no + # convenient way to include that calculation in this debug output. + moments.electron.qpar_updated[] = false + @views calculate_electron_qpar_from_pdf_no_r!(moments.electron.qpar[:,ir], + electron_ppar_new, + moments.electron.vth[:,ir], + f_electron_new, vpa, ir) begin_serial_region() t_params.moments_output_counter[] += 1 @serial_region begin From 9e4e9b2e7887fa8bc3ba0737d62772e040c1c50a Mon Sep 17 00:00:00 2001 From: John Omotani Date: Sun, 12 Jan 2025 17:42:51 +0000 Subject: [PATCH 19/23] Use explicit pseudotimestep for electrons when ion timestep not IMEX If the ion timestep is not IMEX, the electron pressure cannot be advanced implicitly, which is required for a stable implicit electron timestep. Therefore when not using an IMEX timestep method for ions, use explicit timestepping for electron pseudotimestepping loop. Also include a few small fixes for explicit electron timestepping, to update things that were mildly broken by recent updates. --- moment_kinetics/src/electron_kinetic_equation.jl | 11 ++++------- moment_kinetics/src/initial_conditions.jl | 8 ++++++-- moment_kinetics/src/time_advance.jl | 2 +- 3 files changed, 11 insertions(+), 10 deletions(-) diff --git a/moment_kinetics/src/electron_kinetic_equation.jl b/moment_kinetics/src/electron_kinetic_equation.jl index eba1ba1cc..7db7a2387 100644 --- a/moment_kinetics/src/electron_kinetic_equation.jl +++ b/moment_kinetics/src/electron_kinetic_equation.jl @@ -200,10 +200,6 @@ function update_electron_pdf_with_time_advance!(scratch, pdf, moments, phi, coll initial_time=nothing, residual_tolerance=nothing, evolve_ppar=false, ion_dt=nothing) - if max_electron_pdf_iterations !== nothing && max_electron_sim_time !== nothing - error("Cannot use both max_electron_pdf_iterations=$max_electron_pdf_iterations " - * "and max_electron_sim_time=$max_electron_sim_time at the same time") - end if max_electron_pdf_iterations === nothing && max_electron_sim_time === nothing error("Must set one of max_electron_pdf_iterations and max_electron_sim_time") end @@ -2273,8 +2269,9 @@ function apply_electron_bc_and_constraints!(this_scratch, phi, moments, r, z, vp moments.electron.upar[:,ir], z, vperp, vpa, vperp_spectral, vpa_spectral, vpa_advect, moments, num_diss_params.electron.vpa_dissipation_coefficient > 0.0, - composition.me_over_mi, ir; lowerz_vcut_inds=lowerz_vcut_inds, - upperz_vcut_inds=upperz_vcut_inds) + composition.me_over_mi, ir; + lowerz_vcut_ind=(lowerz_vcut_inds === nothing ? nothing : lowerz_vcut_inds[ir]), + upperz_vcut_ind=(upperz_vcut_inds === nothing ? nothing : upperz_vcut_inds[ir])) end begin_r_z_region() @@ -4489,7 +4486,7 @@ appropriate. end adaptive_timestep_update_t_params!(t_params, CFL_limits, error_norms, total_points, - error_norm_method, "", 0.0, composition; + error_norm_method, "", 0.0, false, composition; electron=true, local_max_dt=local_max_dt) if t_params.previous_dt[] == 0.0 # Timestep failed, so reset scratch[t_params.n_rk_stages+1] equal to diff --git a/moment_kinetics/src/initial_conditions.jl b/moment_kinetics/src/initial_conditions.jl index 59cb15035..b42e87fef 100644 --- a/moment_kinetics/src/initial_conditions.jl +++ b/moment_kinetics/src/initial_conditions.jl @@ -706,6 +706,8 @@ function initialize_electron_pdf!(scratch, scratch_electron, pdf, moments, field if !skip_electron_solve # Can't let this counter stay set to 0 t_params.electron.dfns_output_counter[] = max(t_params.electron.dfns_output_counter[], 1) + implicit_electron_pseudotimestep = (nl_solver_params.electron_advance !== nothing) + electron_solution_method = implicit_electron_pseudotimestep ? "backward_euler" : "artificial_time_derivative" success = @views update_electron_pdf!(scratch_electron, pdf.electron.norm, moments, fields.phi, r, z, vperp, vpa, @@ -720,7 +722,8 @@ function initialize_electron_pdf!(scratch, scratch_electron, pdf, moments, field io_electron=io_initial_electron, initial_time=code_time, residual_tolerance=t_input["initialization_residual_value"], - evolve_ppar=true) + evolve_ppar=true, + solution_method=electron_solution_method) if success != "" error("!!!max number of iterations for electron pdf update exceeded!!!\n" * "Stopping at $(Dates.format(now(), dateformat"H:MM:SS"))") @@ -795,7 +798,8 @@ function initialize_electron_pdf!(scratch, scratch_electron, pdf, moments, field max_electron_pdf_iterations, max_electron_sim_time; io_electron=io_initial_electron, - evolve_ppar=true, ion_dt=t_params.dt[]) + evolve_ppar=true, ion_dt=t_params.dt[], + solution_method=electron_solution_method) end if success != "" error("!!!max number of iterations for electron pdf update exceeded!!!\n" diff --git a/moment_kinetics/src/time_advance.jl b/moment_kinetics/src/time_advance.jl index e1f1d3fce..1bfd853b1 100644 --- a/moment_kinetics/src/time_advance.jl +++ b/moment_kinetics/src/time_advance.jl @@ -2551,7 +2551,7 @@ moments and moment derivatives electron_vpa_advect, scratch_dummy, t_params.electron, collisions, composition, external_source_settings, num_diss_params, nl_solver_params.electron_advance, max_electron_pdf_iterations, - max_electron_sim_time) + max_electron_sim_time, solution_method="artificial_time_derivative") success = kinetic_electron_success end end From ee712fccbb2f06039f9f6e49314906ab5b3032c1 Mon Sep 17 00:00:00 2001 From: John Omotani Date: Fri, 10 Jan 2025 17:26:31 +0000 Subject: [PATCH 20/23] Reduce dt if max_linear_iterations_this_step > 1.5*total_its_soft_limit Hopefully makes simulations more efficient overall. --- moment_kinetics/src/electron_kinetic_equation.jl | 5 +++-- moment_kinetics/src/runge_kutta.jl | 16 +++++++++++++++- moment_kinetics/src/time_advance.jl | 14 ++++++++++---- 3 files changed, 28 insertions(+), 7 deletions(-) diff --git a/moment_kinetics/src/electron_kinetic_equation.jl b/moment_kinetics/src/electron_kinetic_equation.jl index 7db7a2387..7c8fcde6a 100644 --- a/moment_kinetics/src/electron_kinetic_equation.jl +++ b/moment_kinetics/src/electron_kinetic_equation.jl @@ -4486,8 +4486,9 @@ appropriate. end adaptive_timestep_update_t_params!(t_params, CFL_limits, error_norms, total_points, - error_norm_method, "", 0.0, false, composition; - electron=true, local_max_dt=local_max_dt) + error_norm_method, "", 0.0, false, false, + composition; electron=true, + local_max_dt=local_max_dt) if t_params.previous_dt[] == 0.0 # Timestep failed, so reset scratch[t_params.n_rk_stages+1] equal to # scratch[1] to start the timestep over. diff --git a/moment_kinetics/src/runge_kutta.jl b/moment_kinetics/src/runge_kutta.jl index 6ea53ba10..481e3f725 100644 --- a/moment_kinetics/src/runge_kutta.jl +++ b/moment_kinetics/src/runge_kutta.jl @@ -1059,6 +1059,7 @@ end adaptive_timestep_update_t_params!(t_params, CFL_limits, error_norms, total_points, error_norm_method, success, nl_max_its_fraction, nl_total_its_soft_limit, + nl_total_its_soft_limit_reduce_dt, composition; electron=false, local_max_dt::mk_float=Inf) @@ -1067,6 +1068,7 @@ Use the calculated `CFL_limits` and `error_norms` to update the timestep in `t_p function adaptive_timestep_update_t_params!(t_params, CFL_limits, error_norms, total_points, error_norm_method, success, nl_max_its_fraction, nl_total_its_soft_limit, + nl_total_its_soft_limit_reduce_dt, composition; electron=false, local_max_dt::mk_float=Inf) # Get global minimum of CFL limits @@ -1327,7 +1329,19 @@ function adaptive_timestep_update_t_params!(t_params, CFL_limits, error_norms, end end - if (nl_max_its_fraction > 0.5 || nl_total_its_soft_limit) && t_params.previous_dt[] > 0.0 + if nl_total_its_soft_limit_reduce_dt && t_params.previous_dt[] > 0.0 + # The last step took very many nonlinear iterations, so reduce the + # timestep slightly. + # If t_params.previous_dt[]==0.0, then the previous step failed so + # timestep will not be increasing, so do not need this check. + iteration_limited_dt = t_params.previous_dt[] / t_params.max_increase_factor + if t_params.dt[] > iteration_limited_dt + t_params.dt[] = iteration_limited_dt + @serial_region begin + this_limit_caused_by = 5 + end + end + elseif (nl_max_its_fraction > 0.5 || nl_total_its_soft_limit) && t_params.previous_dt[] > 0.0 # The last step took many nonlinear iterations, so do not allow the # timestep to increase. # If t_params.previous_dt[]==0.0, then the previous step failed so diff --git a/moment_kinetics/src/time_advance.jl b/moment_kinetics/src/time_advance.jl index 1bfd853b1..777f9b4ec 100644 --- a/moment_kinetics/src/time_advance.jl +++ b/moment_kinetics/src/time_advance.jl @@ -2635,7 +2635,8 @@ end advect_objects, gyroavs, num_diss_params, nl_solver_params, advance, scratch_dummy, r, z, vperp, vpa, vzeta, vr, vz, success, nl_max_its_fraction, - nl_total_its_soft_limit) + nl_total_its_soft_limit, + nl_total_its_soft_limit_reduce_dt) Check the error estimate for the embedded RK method and adjust the timestep if appropriate. @@ -2646,7 +2647,8 @@ appropriate. geometry, external_source_settings, spectral_objects, advect_objects, gyroavs, num_diss_params, nl_solver_params, advance, scratch_dummy, r, z, vperp, vpa, vzeta, vr, vz, success, - nl_max_its_fraction, nl_total_its_soft_limit) = begin + nl_max_its_fraction, nl_total_its_soft_limit, + nl_total_its_soft_limit_reduce_dt) = begin #error_norm_method = "Linf" error_norm_method = "L2" @@ -2960,7 +2962,8 @@ appropriate. adaptive_timestep_update_t_params!(t_params, CFL_limits, error_norms, total_points, error_norm_method, success, nl_max_its_fraction, - nl_total_its_soft_limit, composition) + nl_total_its_soft_limit, + nl_total_its_soft_limit_reduce_dt, composition) if composition.electron_physics ∈ (kinetic_electrons, kinetic_electrons_with_temperature_equation) @@ -3262,6 +3265,7 @@ end if t_params.adaptive nl_max_its_fraction = 0.0 nl_total_its_soft_limit = false + nl_total_its_soft_limit_reduce_dt = false if t_params.implicit_electron_advance || t_params.implicit_electron_time_evolving params_to_check = (nl_solver_params.ion_advance, nl_solver_params.vpa_advection, @@ -3288,6 +3292,7 @@ end max(p.max_nonlinear_iterations_this_step[] / p.nonlinear_max_iterations, nl_max_its_fraction) nl_total_its_soft_limit = p.max_linear_iterations_this_step[] > p.total_its_soft_limit || nl_total_its_soft_limit + nl_total_its_soft_limit_reduce_dt = p.max_linear_iterations_this_step[] > 1.5 * p.total_its_soft_limit || nl_total_its_soft_limit_reduce_dt end end adaptive_timestep_update!(scratch, scratch_implicit, scratch_electron, @@ -3297,7 +3302,8 @@ end advect_objects, gyroavs, num_diss_params, nl_solver_params, advance, scratch_dummy, r, z, vperp, vpa, vzeta, vr, vz, success, nl_max_its_fraction, - nl_total_its_soft_limit) + nl_total_its_soft_limit, + nl_total_its_soft_limit_reduce_dt) elseif success != "" error("Implicit part of timestep failed") end From e23c75c9d4dd04764b948cea99cfd0626a286af4 Mon Sep 17 00:00:00 2001 From: John Omotani Date: Mon, 13 Jan 2025 11:28:12 +0000 Subject: [PATCH 21/23] Increase timeout for 'longtest' CI job We have added new tests (Fokker-Planck collision operator and kinetic electrons), which made the job take too long for the previous timeout. --- .github/workflows/longtest.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/longtest.yml b/.github/workflows/longtest.yml index 8d4990bb6..5c0890c04 100644 --- a/.github/workflows/longtest.yml +++ b/.github/workflows/longtest.yml @@ -15,7 +15,7 @@ jobs: matrix: os: [ubuntu-latest, macOS-latest] fail-fast: false - timeout-minutes: 90 + timeout-minutes: 120 steps: - uses: actions/checkout@v4 From 64276bff3b1a22729c210dddc64b6239d206755a Mon Sep 17 00:00:00 2001 From: John Omotani Date: Mon, 13 Jan 2025 17:15:51 +0000 Subject: [PATCH 22/23] Avoid allocations in gauss_legendre.mass_matrix_solve! Use the in-place version `ldiv!()` for the matrix solve. --- moment_kinetics/src/gauss_legendre.jl | 5 ++--- 1 file changed, 2 insertions(+), 3 deletions(-) diff --git a/moment_kinetics/src/gauss_legendre.jl b/moment_kinetics/src/gauss_legendre.jl index 8bfd386ea..bb5135ba9 100644 --- a/moment_kinetics/src/gauss_legendre.jl +++ b/moment_kinetics/src/gauss_legendre.jl @@ -23,7 +23,7 @@ export get_QQ_local! using FastGaussQuadrature using LegendrePolynomials: Pl, dnPl -using LinearAlgebra: mul!, lu, LU +using LinearAlgebra: mul!, lu, ldiv! using SparseArrays: sparse, AbstractSparseArray using SparseMatricesCSR using ..type_definitions: mk_float, mk_int @@ -459,8 +459,7 @@ Function to carry out a 1D (global) mass matrix solve. """ function mass_matrix_solve!(f, b, spectral::gausslegendre_info) # invert mass matrix system - y = spectral.mass_matrix_lu \ b - @. f = y + ldiv!(f, spectral.mass_matrix_lu, b) return nothing end From a0b0a72afa60d552039f78b55e233c6982be16fc Mon Sep 17 00:00:00 2001 From: John Omotani Date: Mon, 13 Jan 2025 17:18:44 +0000 Subject: [PATCH 23/23] Micro-optimise a few electron-advance loops Removes some allocations, and speeds up a few loops. The speed-up for a given loop is substantial, but these loops were not a large fraction of the run-time, so the overall effect will be minimal. Also adds a few extra timers to ensure all functions in `electron_kinetic_equation_euler_update!()` are timed. --- .../src/electron_fluid_equations.jl | 17 +++--- .../src/electron_kinetic_equation.jl | 57 ++++++++++--------- moment_kinetics/src/electron_vpa_advection.jl | 8 +-- moment_kinetics/src/external_sources.jl | 7 +-- 4 files changed, 46 insertions(+), 43 deletions(-) diff --git a/moment_kinetics/src/electron_fluid_equations.jl b/moment_kinetics/src/electron_fluid_equations.jl index 516e81161..c77d8c1ac 100644 --- a/moment_kinetics/src/electron_fluid_equations.jl +++ b/moment_kinetics/src/electron_fluid_equations.jl @@ -132,6 +132,7 @@ function calculate_electron_moments!(scratch, pdf, moments, composition, collisi else pdf_electron = pdf.electron end + electron_ppar = scratch.electron_ppar calculate_electron_density!(scratch.electron_density, moments.electron.dens_updated, scratch.density) calculate_electron_upar_from_charge_conservation!( @@ -141,20 +142,20 @@ function calculate_electron_moments!(scratch, pdf, moments, composition, collisi kinetic_electrons_with_temperature_equation) begin_r_z_region() @loop_r_z ir iz begin - scratch.electron_ppar[iz,ir] = 0.5 * composition.me_over_mi * - scratch.electron_density[iz,ir] * - moments.electron.vth[iz,ir]^2 + electron_ppar[iz,ir] = 0.5 * composition.me_over_mi * + scratch.electron_density[iz,ir] * + moments.electron.vth[iz,ir]^2 end moments.electron.ppar_updated[] = true end - update_electron_vth_temperature!(moments, scratch.electron_ppar, - scratch.electron_density, composition) - calculate_electron_qpar!(moments.electron, pdf_electron, scratch.electron_ppar, + update_electron_vth_temperature!(moments, electron_ppar, scratch.electron_density, + composition) + calculate_electron_qpar!(moments.electron, pdf_electron, electron_ppar, scratch.electron_upar, scratch.upar, collisions.electron_fluid.nu_ei, composition.me_over_mi, composition.electron_physics, vpa) if composition.electron_physics == braginskii_fluid - electron_fluid_qpar_boundary_condition!(scratch.electron_ppar, + electron_fluid_qpar_boundary_condition!(electron_ppar, scratch.electron_upar, scratch.electron_density, moments.electron, z) @@ -869,7 +870,7 @@ function calculate_electron_qpar_from_pdf!(qpar, ppar, vth, pdf, vpa) begin_r_z_region() ivperp = 1 @loop_r_z ir iz begin - @views qpar[iz, ir] = 2*ppar[iz,ir]*vth[iz,ir]*integrate_over_vspace(pdf[:, ivperp, iz, ir], vpa.grid.^3, vpa.wgts) + @views qpar[iz, ir] = 2*ppar[iz,ir]*vth[iz,ir]*integrate_over_vspace(pdf[:, ivperp, iz, ir], vpa.grid, 3, vpa.wgts) end end diff --git a/moment_kinetics/src/electron_kinetic_equation.jl b/moment_kinetics/src/electron_kinetic_equation.jl index 7c8fcde6a..556490a6d 100644 --- a/moment_kinetics/src/electron_kinetic_equation.jl +++ b/moment_kinetics/src/electron_kinetic_equation.jl @@ -4775,18 +4775,20 @@ Note that this function operates on a single point in `r`, given by `ir`, and `f composition, external_source_settings.electron, num_diss_params, z, ir) if ion_dt !== nothing - # Add source term to turn steady state solution into a backward-Euler update of - # electron_ppar with the ion timestep `ion_dt`. - ppar_previous_ion_step = moments.electron.ppar - begin_z_region() - @loop_z iz begin - # At this point, ppar_out = ppar_in + dt*RHS(ppar_in). Here we add a - # source/damping term so that in the steady state of the electron - # pseudo-timestepping iteration, - # RHS(ppar) - (ppar - ppar_previous_ion_step) / ion_dt = 0, - # resulting in a backward-Euler step (as long as the pseudo-timestepping - # loop converges). - ppar_out[iz] += -dt * (ppar_in[iz] - ppar_previous_ion_step[iz,ir]) / ion_dt + @timeit global_timer "electron_ppar_ion_dt" begin + # Add source term to turn steady state solution into a backward-Euler + # update of electron_ppar with the ion timestep `ion_dt`. + ppar_previous_ion_step = moments.electron.ppar + begin_z_region() + @loop_z iz begin + # At this point, ppar_out = ppar_in + dt*RHS(ppar_in). Here we add a + # source/damping term so that in the steady state of the electron + # pseudo-timestepping iteration, + # RHS(ppar) - (ppar - ppar_previous_ion_step) / ion_dt = 0, + # resulting in a backward-Euler step (as long as the + # pseudo-timestepping loop converges). + ppar_out[iz] += -dt * (ppar_in[iz] - ppar_previous_ion_step[iz,ir]) / ion_dt + end end end end @@ -5521,8 +5523,8 @@ function add_source_term!(source_term, vpa, z, dvth_dz) return nothing end -function add_dissipation_term!(pdf_out, pdf_in, scratch_dummy, z_spectral, z, vpa, - vpa_spectral, num_diss_params, dt) +@timeit global_timer add_dissipation_term!(pdf_out, pdf_in, scratch_dummy, z_spectral, z, + vpa, vpa_spectral, num_diss_params, dt) = begin if num_diss_params.electron.vpa_dissipation_coefficient ≤ 0.0 return nothing end @@ -5530,7 +5532,7 @@ function add_dissipation_term!(pdf_out, pdf_in, scratch_dummy, z_spectral, z, vp begin_z_vperp_region() @loop_z_vperp iz ivperp begin @views second_derivative!(vpa.scratch, pdf_in[:,ivperp,iz], vpa, vpa_spectral) - @. pdf_out[:,ivperp,iz] += dt * num_diss_params.electron.vpa_dissipation_coefficient * vpa.scratch + @views @. pdf_out[:,ivperp,iz] += dt * num_diss_params.electron.vpa_dissipation_coefficient * vpa.scratch end return nothing end @@ -5803,13 +5805,14 @@ function calculate_pdf_dot_prefactor!(pdf_dot_prefactor, ppar, vth, dens, ddens_ end # add contribution to the residual coming from the term proporational to the pdf -function add_contribution_from_pdf_term!(pdf_out, pdf_in, ppar, dens, upar, moments, vpa, - z, dt, electron_source_settings, ir) +@timeit global_timer add_contribution_from_pdf_term!(pdf_out, pdf_in, ppar, dens, upar, + moments, vpa, z, dt, + electron_source_settings, ir) = begin vth = @view moments.electron.vth[:,ir] ddens_dz = @view moments.electron.ddens_dz[:,ir] dvth_dz = @view moments.electron.dvth_dz[:,ir] dqpar_dz = @view moments.electron.dqpar_dz[:,ir] - begin_z_vperp_vpa_region() + begin_z_vperp_region() @loop_z iz begin this_dqpar_dz = dqpar_dz[iz] this_ppar = ppar[iz] @@ -5818,11 +5821,11 @@ function add_contribution_from_pdf_term!(pdf_out, pdf_in, ppar, dens, upar, mome this_dens = dens[iz] this_dvth_dz = dvth_dz[iz] this_vth = vth[iz] - @loop_vperp_vpa ivperp ivpa begin - pdf_out[ivpa,ivperp,iz] += - dt * (-0.5 * this_dqpar_dz / this_ppar - vpa[ivpa] * this_vth * + @loop_vperp ivperp begin + @views @. pdf_out[:,ivperp,iz] += + dt * (-0.5 * this_dqpar_dz / this_ppar - vpa * this_vth * (this_ddens_dz / this_dens - this_dvth_dz / this_vth)) * - pdf_in[ivpa,ivperp,iz] + pdf_in[:,ivperp,iz] end end @@ -5832,11 +5835,11 @@ function add_contribution_from_pdf_term!(pdf_out, pdf_in, ppar, dens, upar, mome @views source_momentum_amplitude = moments.electron.external_source_momentum_amplitude[:, ir, index] @views source_pressure_amplitude = moments.electron.external_source_pressure_amplitude[:, ir, index] @loop_z iz begin - term = dt * (1.5 * source_density_amplitude[iz,ir] / dens[iz,ir] - - (0.5 * source_pressure_amplitude[iz,ir] + - source_momentum_amplitude[iz,ir]) / ppar[iz,ir]) - @loop_vperp_vpa ivperp ivpa begin - pdf_out[ivpa,ivperp,iz,ir] -= term * pdf_in[ivpa,ivperp,iz,ir] + term = dt * (1.5 * source_density_amplitude[iz] / dens[iz] - + (0.5 * source_pressure_amplitude[iz] + + source_momentum_amplitude[iz]) / ppar[iz]) + @loop_vperp ivperp begin + @views @. pdf_out[:,ivperp,iz] -= term * pdf_in[:,ivperp,iz] end end end diff --git a/moment_kinetics/src/electron_vpa_advection.jl b/moment_kinetics/src/electron_vpa_advection.jl index 2ffcc3298..07e14d876 100644 --- a/moment_kinetics/src/electron_vpa_advection.jl +++ b/moment_kinetics/src/electron_vpa_advection.jl @@ -61,10 +61,10 @@ function update_electron_speed_vpa!(advect, density, upar, ppar, moments, vpa, dppar_dz = @view moments.electron.dppar_dz[:,ir] dqpar_dz = @view moments.electron.dqpar_dz[:,ir] dvth_dz = @view moments.electron.dvth_dz[:,ir] - speed = advect.speed + speed = @view advect.speed[:,:,:,ir] # calculate the advection speed in wpa @loop_z_vperp_vpa iz ivperp ivpa begin - speed[ivpa,ivperp,iz,ir] = ((vth[iz] * dppar_dz[iz] + vpa[ivpa] * dqpar_dz[iz]) + speed[ivpa,ivperp,iz] = ((vth[iz] * dppar_dz[iz] + vpa[ivpa] * dqpar_dz[iz]) / (2 * ppar[iz]) - vpa[ivpa]^2 * dvth_dz[iz]) end @@ -80,8 +80,8 @@ function update_electron_speed_vpa!(advect, density, upar, ppar, moments, vpa, 2.0 * upar[iz] * source_momentum_amplitude[iz]) / ppar[iz] + 0.5 * source_density_amplitude[iz] / density[iz] - @loop_vperp_vpa ivperp ivpa begin - speed[ivpa,ivperp,iz,ir] += term1 + vpa[ivpa] * term2_over_vpa + @loop_vperp ivperp begin + @. speed[:,ivperp,iz] += term1 + vpa * term2_over_vpa end end end diff --git a/moment_kinetics/src/external_sources.jl b/moment_kinetics/src/external_sources.jl index c1990325c..2195c3217 100644 --- a/moment_kinetics/src/external_sources.jl +++ b/moment_kinetics/src/external_sources.jl @@ -989,14 +989,13 @@ Note that this function operates on a single point in `r`, given by `ir`, and `p this_upar = electron_upar[iz] this_prefactor = dt * this_vth / electron_density[iz] * vth_factor * source_amplitude[iz] - @loop_vperp_vpa ivperp ivpa begin + @loop_vperp ivperp begin # Factor of 1/sqrt(π) (for 1V) or 1/π^(3/2) (for 2V/3V) is absorbed by the # normalisation of F vperp_unnorm = vperp_grid[ivperp] * this_vth - vpa_unnorm = vpa_grid[ivpa] * this_vth + this_upar - pdf_out[ivpa,ivperp,iz] += + @. pdf_out[:,ivperp,iz] += this_prefactor * - exp(-(vperp_unnorm^2 + vpa_unnorm^2) * me_over_mi / source_T) + exp(-(vperp_unnorm^2 + (vpa_grid * this_vth + this_upar)^2) * me_over_mi / source_T) end end