-
Notifications
You must be signed in to change notification settings - Fork 0
/
submit_anime_gilbreth.sh
57 lines (41 loc) · 1.57 KB
/
submit_anime_gilbreth.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
#!/bin/bash
# change the directory path of model run-time output and error messages to your own
#SBATCH --output=/scratch/gilbreth/gupt1075/run_fourcastnet.out
#SBATCH --error=/scratch/gilbreth/gupt1075/run_fourcastnet.err
# The file name of this submission file, so it's easier to track jobs
# filename: submit_run_model_example.sub
#SBATCH --nodes=1
#SBATCH --ntasks-per-node=32
#SBATCH --gres=gpu:1
#SBATCH --time=23:00:00
# partner queue has a 24-hour limit
#SBATCH -A gdsp-k
#SBATCH -C "v100|a100"
# Job name, it will show up when you track this job
#SBATCH -J fourcastnet_job
# Use your email address so that you will receive email notifications about the job begin, end, or fail status
# To submit the job via command line:$ sbatch submit_run_model_example.sub
# To check status of the submitted job:$ squeue -u yourUserID
module --force purge
unset PYTHONPATH
module load anaconda/5.3.1-py37
module load cuda/11.7.0
module load cudnn/cuda-11.7_8.6
module use /depot/gdsp/etc/modules
module load utilities monitor
module load rcac
module list
export PRECXX11ABI=1
export CUDA="11.7"
echo $PYTHONPATH
# # track per-code CPU load
# monitor cpu percent --all-cores >cpu-percent.log &
# CPU_PID=$!
# # track memory usage
# monitor cpu memory >cpu-memory.log &
# MEM_PID=$!
source /apps/spack/gilbreth/apps/anaconda/5.3.1-py37-gcc-4.8.5-7vvmykn/etc/profile.d/conda.sh
conda activate pytorch
# Change this directory to where you save the model-related files such as run_model.py
cd /scratch/gilbreth/wwtung/FourCastNet/
python /scratch/gilbreth/gupt1075/FourCastNet/animate_input.py