Skip to content

Commit

Permalink
Only capture nsys in solve-atmos
Browse files
Try with timed_solve

Try range-at-domain

Try with single quotes

Try using delay keyword

Shorten simulations

wip
  • Loading branch information
charleskawczynski committed Oct 29, 2024
1 parent 7d36e14 commit 39cd680
Show file tree
Hide file tree
Showing 5 changed files with 24 additions and 23 deletions.
2 changes: 1 addition & 1 deletion .buildkite/comparison/pipeline.sh
Original file line number Diff line number Diff line change
Expand Up @@ -75,7 +75,7 @@ else
fi

if [[ "$profiling" == "enable" ]]; then
command="nsys profile --trace=nvtx,mpi --mpi-impl=mpich --output=${job_id}/report.%q{NPROCS}.%q{PMI_RANK} $command"
command="nsys profile --delay 100 --trace=nvtx,mpi --mpi-impl=mpich --output=${job_id}/report.%q{NPROCS}.%q{PMI_RANK} $command"
fi

cat << EOM
Expand Down
19 changes: 10 additions & 9 deletions .buildkite/gpu_pipeline/pipeline.yml
Original file line number Diff line number Diff line change
Expand Up @@ -51,7 +51,7 @@ steps:
command:
- mkdir -p target_gpu_implicit_baroclinic_wave
- >
nsys profile --trace=nvtx,mpi,cuda,osrt --output=target_gpu_implicit_baroclinic_wave/output_active/report
nsys profile --delay 100 --trace=nvtx,mpi,cuda,osrt --output=target_gpu_implicit_baroclinic_wave/output_active/report
julia --threads=3 --color=yes --project=examples examples/hybrid/driver.jl
--config_file ${GPU_CONFIG_PATH}target_gpu_implicit_baroclinic_wave.yml
--job_id target_gpu_implicit_baroclinic_wave
Expand All @@ -68,7 +68,7 @@ steps:
command:
- mkdir -p gpu_hs_rhoe_equil_55km_nz63_0M
- >
nsys profile --trace=nvtx,mpi,cuda,osrt --output=gpu_hs_rhoe_equil_55km_nz63_0M/output_active/report
nsys profile --delay 100 --trace=nvtx,mpi,cuda,osrt --output=gpu_hs_rhoe_equil_55km_nz63_0M/output_active/report
julia --threads=3 --color=yes --project=examples examples/hybrid/driver.jl
--config_file ${GPU_CONFIG_PATH}gpu_hs_rhoe_equil_55km_nz63_0M.yml
--job_id gpu_hs_rhoe_equil_55km_nz63_0M
Expand All @@ -86,7 +86,7 @@ steps:
- mkdir -p gpu_hs_rhoe_equil_55km_nz63_0M_4process
- >
srun --cpu-bind=threads --cpus-per-task=4
nsys profile --trace=nvtx,mpi,cuda,osrt --output=gpu_hs_rhoe_equil_55km_nz63_0M_4process/output_active/report-%q{PMI_RANK}
nsys profile --delay 100 --trace=nvtx,mpi,cuda,osrt --output=gpu_hs_rhoe_equil_55km_nz63_0M_4process/output_active/report-%q{PMI_RANK}
julia --threads=3 --color=yes --project=examples examples/hybrid/driver.jl
--config_file ${GPU_CONFIG_PATH}gpu_hs_rhoe_equil_55km_nz63_0M.yml
--job_id gpu_hs_rhoe_equil_55km_nz63_0M_4process
Expand All @@ -106,7 +106,7 @@ steps:
- mkdir -p target_gpu_implicit_baroclinic_wave_4process
- >
srun --cpu-bind=threads --cpus-per-task=4
nsys profile --trace=osrt,nvtx,cuda,mpi,ucx --output=target_gpu_implicit_baroclinic_wave_4process/output_active/report-%q{PMI_RANK}
nsys profile --delay 100 --trace=osrt,nvtx,cuda,mpi,ucx --output=target_gpu_implicit_baroclinic_wave_4process/output_active/report-%q{PMI_RANK}
julia --threads=3 --color=yes --project=examples examples/hybrid/driver.jl
--config_file ${GPU_CONFIG_PATH}target_gpu_implicit_baroclinic_wave.yml
--job_id target_gpu_implicit_baroclinic_wave_4process
Expand All @@ -128,7 +128,7 @@ steps:
- mkdir -p gpu_aquaplanet_dyamond_diag_1process
- >
srun --cpu-bind=threads --cpus-per-task=4
nsys profile --trace=nvtx,mpi,cuda,osrt --output=gpu_aquaplanet_dyamond_diag_1process/output_active/report julia --threads=3 --color=yes --project=examples examples/hybrid/driver.jl
nsys profile --delay 100 --trace=nvtx,mpi,cuda,osrt --output=gpu_aquaplanet_dyamond_diag_1process/output_active/report julia --threads=3 --color=yes --project=examples examples/hybrid/driver.jl
--config_file ${GPU_CONFIG_PATH}gpu_aquaplanet_dyamond_diag_1process.yml
--job_id gpu_aquaplanet_dyamond_diag_1process
artifact_paths: "gpu_aquaplanet_dyamond_diag_1process/output_active/*"
Expand All @@ -148,7 +148,7 @@ steps:
- mkdir -p gpu_aquaplanet_dyamond_ss_1process
- >
srun --cpu-bind=threads --cpus-per-task=4
nsys profile --trace=nvtx,mpi,cuda,osrt --output=gpu_aquaplanet_dyamond_ss_1process/output_active/report
nsys profile --delay 100 --trace=nvtx,mpi,cuda,osrt --output=gpu_aquaplanet_dyamond_ss_1process/output_active/report
julia --threads=3 --color=yes --project=examples examples/hybrid/driver.jl
--config_file ${GPU_CONFIG_PATH}gpu_aquaplanet_dyamond_ss.yml
--job_id gpu_aquaplanet_dyamond_ss_1process
Expand Down Expand Up @@ -307,7 +307,7 @@ steps:
command:
- mkdir -p gpu_aquaplanet_diagedmf
- >
nsys profile --trace=nvtx,mpi,cuda,osrt --output=gpu_aquaplanet_diagedmf/output_active/report
nsys profile --delay 200 --trace=nvtx,mpi,cuda,osrt --output=gpu_aquaplanet_diagedmf/output_active/report
julia --threads=3 --color=yes --project=examples examples/hybrid/driver.jl
--config_file ${MODEL_CONFIG_PATH}aquaplanet_diagedmf.yml
--job_id gpu_aquaplanet_diagedmf
Expand All @@ -319,7 +319,7 @@ steps:
slurm_gpus_per_task: 1
slurm_cpus_per_task: 4
slurm_ntasks: 1
slurm_mem: 32G
slurm_mem: 64G
slurm_exclusive:

- label: "gpu_aquaplanet_diagedmf_benchmark"
Expand All @@ -331,6 +331,7 @@ steps:
env:
CLIMACOMMS_DEVICE: "CUDA"
agents:
slurm_mem: 64G
slurm_gpus: 1

- group: "Prognostic EDMF GPU"
Expand All @@ -340,7 +341,7 @@ steps:
command:
- mkdir -p gpu_aquaplanet_progedmf
- >
nsys profile --trace=nvtx,mpi,cuda,osrt --output=gpu_aquaplanet_progedmf/output_active/report
nsys profile --delay 100 --trace=nvtx,mpi,cuda,osrt --output=gpu_aquaplanet_progedmf/output_active/report
julia --threads=3 --color=yes --project=examples examples/hybrid/driver.jl
--config_file ${MODEL_CONFIG_PATH}aquaplanet_progedmf.yml
--job_id gpu_aquaplanet_progedmf
Expand Down
8 changes: 4 additions & 4 deletions .buildkite/pipeline.yml
Original file line number Diff line number Diff line change
Expand Up @@ -871,7 +871,7 @@ steps:
command:
- mkdir -p target_gpu_implicit_baroclinic_wave
- >
nsys profile --trace=nvtx,cuda --output=target_gpu_implicit_baroclinic_wave/output_active/report
nsys profile --delay 100 --trace=nvtx,cuda --output=target_gpu_implicit_baroclinic_wave/output_active/report
julia --color=yes --project=examples examples/hybrid/driver.jl
--config_file ${GPU_CONFIG_PATH}/target_gpu_implicit_baroclinic_wave.yml
--job_id target_gpu_implicit_baroclinic_wave
Expand All @@ -885,7 +885,7 @@ steps:
- label: "GPU: GPU dry baroclinic wave - 4 gpus"
key: "target_gpu_implicit_baroclinic_wave_4process"
command:
# nsys profile --trace=nvtx,cuda,mpi --output=target_gpu_implicit_baroclinic_wave_4process/output_active/report-%q{PMI_RANK}
# nsys profile --delay 100 --trace=nvtx,cuda,mpi --output=target_gpu_implicit_baroclinic_wave_4process/output_active/report-%q{PMI_RANK}
- mkdir -p target_gpu_implicit_baroclinic_wave_4process
- >
srun --cpu-bind=threads --cpus-per-task=4
Expand All @@ -905,7 +905,7 @@ steps:
- label: "GPU: GPU moist Held-Suarez"
command:
- >
nsys profile --trace=nvtx,cuda --output=central_gpu_hs_rhoe_equil_55km_nz63_0M/output_active/report
nsys profile --delay 100 --trace=nvtx,cuda --output=central_gpu_hs_rhoe_equil_55km_nz63_0M/output_active/report
julia --color=yes --project=examples examples/hybrid/driver.jl
--config_file $CONFIG_PATH/central_gpu_hs_rhoe_equil_55km_nz63_0M.yml
--job_id central_gpu_hs_rhoe_equil_55km_nz63_0M
Expand All @@ -919,7 +919,7 @@ steps:
- label: "GPU: GPU moist Held-Suarez cloud diagnostics per stage"
command:
- >
nsys profile --trace=nvtx,cuda --output=central_cloud_diag_gpu_hs_rhoe_equil_55km_nz63_0M/output_active/report
nsys profile --delay 100 --trace=nvtx,cuda --output=central_cloud_diag_gpu_hs_rhoe_equil_55km_nz63_0M/output_active/report
julia --color=yes --project=examples examples/hybrid/driver.jl
--config_file $CONFIG_PATH/central_cloud_diag_gpu_hs_rhoe_equil_55km_nz63_0M.yml
--job_id central_cloud_diag_gpu_hs_rhoe_equil_55km_nz63_0M
Expand Down
16 changes: 8 additions & 8 deletions config/model_configs/aquaplanet_diagedmf.yml
Original file line number Diff line number Diff line change
Expand Up @@ -7,25 +7,25 @@ z_elem: 63
dz_bottom: 30.0
rayleigh_sponge: true
viscous_sponge: true
moist: equil
surface_setup: DefaultMoninObukhov
moist: equil
surface_setup: DefaultMoninObukhov
rad: allskywithclear
insolation: "timevarying"
dt_rad: 1hours
dt_cloud_fraction: 1hours
turbconv: diagnostic_edmfx
turbconv: diagnostic_edmfx
implicit_diffusion: true
approximate_linear_solve_iters: 2
prognostic_tke: true
edmfx_upwinding: first_order
edmfx_entr_model: "Generalized"
edmfx_detr_model: "Generalized"
edmfx_nh_pressure: true
edmfx_upwinding: first_order
edmfx_entr_model: "Generalized"
edmfx_detr_model: "Generalized"
edmfx_nh_pressure: true
edmfx_sgs_mass_flux: true
edmfx_sgs_diffusive_flux: true
cloud_model: "quadrature_sgs"
precip_model: 0M
dt: 90secs
t_end: 1days
t_end: 61mins
toml: [toml/diagnostic_edmfx.toml]
ode_algo: ARS343
2 changes: 1 addition & 1 deletion config/model_configs/aquaplanet_progedmf.yml
Original file line number Diff line number Diff line change
Expand Up @@ -28,6 +28,6 @@ edmfx_sgs_mass_flux: true
edmfx_sgs_diffusive_flux: true
precip_model: 0M
dt: 10secs
t_end: 3hours
t_end: 61mins
toml: [toml/prognostic_edmfx.toml]
ode_algo: ARS343

0 comments on commit 39cd680

Please sign in to comment.