Training script #31
Merged · +2,033 −38
Changes from 1 commit (150 commits total)
Commits:
5aa939a add llama2.c submodule (jannik-brinkmann)
27e7df4 rename submodule to avoid import errors (jannik-brinkmann)
f9dbff2 add llama2.c wrapper (jannik-brinkmann)
1b394e0 draft training.py (jannik-brinkmann)
9fba402 updated draft (jannik-brinkmann)
e11de88 Adding a Mamba Class (SrGonao)
6287121 Moving stuff to the correct place (SrGonao)
e42a8db Not ready but idea there (SrGonao)
6642256 updated training script (jannik-brinkmann)
b9cdc78 formatting (jettjaniak)
294e792 remove gitmodules (jettjaniak)
c95c28b moved llama2c submodule (jettjaniak)
27891b5 llama2c update (jettjaniak)
cd2c5f7 fix import (jettjaniak)
145f8aa remove unused files (jettjaniak)
fe834b0 rename training_old -> training (jettjaniak)
f7eacd7 Moved Mamba (SrGonao)
a88be1f Added type hinting (SrGonao)
0d356af Removed not needed file (SrGonao)
646b3e7 Removed compile, amp train fp32 (SrGonao)
b04975a fixing black and isort (SrGonao)
2b056ca add submodules to checkout in CI (jettjaniak)
23f8a55 pyproject.toml, moved isort cfg, excl. llama2c (jettjaniak)
f7cc6b7 isort: llama2c known_third_party (jettjaniak)
e863604 limit pytest to tests/ directory (jettjaniak)
a00425b Training_script_refactor (#54) (jaidhyani)
2aa2ea6 It's actually a script now (jaidhyani)
ce4a6ca lol copypasting (jaidhyani)
83496e2 cleanup (jaidhyani)
30a1b30 Adding support for config files (jaidhyani)
4098036 comments (jaidhyani)
96f2361 flag arguments take priority over config file values (jaidhyani) — see the config sketch after this list
584c55d comments (jaidhyani)
d79d50c gitignore .DS_Store file on macos (jaidhyani)
9e1e9d8 remove training.sh (jaidhyani)
27f5d43 meeting notes and tweaks (jaidhyani)
e542237 configurable device (jaidhyani)
0524030 Adding mamba implementation (SrGonao)
29e986e mamba hacks, please forgive me (jaidhyani)
d8831bd experimenting with cuda support in gh actions (jaidhyani)
95d534d welp, that didn't work (jaidhyani)
8716bf7 remove tokenized_chunks_dataset (jaidhyani)
7352eec separate batch ordering and torch seeds (jaidhyani)
c3e5ef7 remove mamba.py (jaidhyani)
7cb4ca7 refactoring (jaidhyani)
7213aa4 rm TODO (jaidhyani)
a8f7143 refactoring (jaidhyani)
e038f31 bughunt (jaidhyani)
59fce94 debugger config (jaidhyani)
734b92e typing improvements and bugfixes (jaidhyani)
2ed386c add support for "x.y.z = val" style config (jaidhyani) — see the config sketch after this list
c928d3b first steps towards Llama2HF support (jaidhyani)
54b095a more debugging stuff (jaidhyani)
fee0497 initial HF llama2 support (jaidhyani)
2665633 debug more (jaidhyani)
2f65438 Add support for preset model configs in script, specifying multiple c… (jaidhyani)
4c64774 bughunt (jaidhyani)
a9ac3dd fix beartype Callalble deprecation warning (jaidhyani)
3d7711a rm llamaconfig json accidentally added before (jaidhyani)
c4e69d2 asdf (jaidhyani)
656228c script tweaks (jaidhyani)
27fdc79 better gigaconfig defaults (jaidhyani)
398f1de debug config is now just another preset; better documentation for sub… (jaidhyani)
366b4b5 fix imports (jaidhyani)
d4a81e8 remove upload_tokens (jaidhyani)
5dc23e6 Whoops. I should probably test things more before pushing them. (jaidhyani)
2f1a0a4 cleanup (jaidhyani)
1f37228 script tweaks (jaidhyani)
adfd4b4 added support for prioritizing configs (jaidhyani)
e3b326c refactoring (config_utils) to support notebook use (jaidhyani)
551a8de fix Llama2ConfigData bug in gigaconfig (use default_factory) (jaidhyani)
cd9a5b1 make run_training return ModelTrainingState (jaidhyani)
ab19879 more config_utils (jaidhyani)
bc8b43d cleanup run_training script (jaidhyani)
859ae09 training_demo notebook (for colab) (jaidhyani)
fc3f021 static files tweak (jaidhyani)
70e82ee estimate_mfu for llama2hf (jaidhyani)
697f729 Don't break if model export not available (jaidhyani)
a8f7a4f 100k quick config (jaidhyani)
997ec3a torch.use_deterministic_algorithms for training (jaidhyani)
f9bd899 import Callable from collections.abc (jaidhyani)
89cee7c Move up torch.manual_seed before calling anything in torch (jaidhyani)
698365f add wandb to requirements (jaidhyani)
7f6c180 factor out training config package + wandb_config (jaidhyani)
662555d unused import (jaidhyani)
0699026 isort (jaidhyani)
4007b6a initial mamba support (jaidhyani)
594033e pip install wheel (jaidhyani)
cc010da pip install packaging (jaidhyani)
bfb28c1 come on, mamba_ssm, get it together (jaidhyani)
f85d015 requirements-nocuda.txt for gh actions (jaidhyani)
3c0010b Merge branch 'main' into training-script (jaidhyani)
4870d92 mv ModelTypes to constants (jaidhyani)
9eeb960 deprecate llama2c support (jaidhyani)
02ec1a1 clear out more llama2c stuff (jaidhyani)
6cb9d52 we still need max_seq_len (jaidhyani)
35cb7c4 factoring out optimizer params from config (jaidhyani)
5e10db2 fix broken test (jaidhyani)
af6c0db model_args overhaul (jaidhyani)
2a9d2c2 rm llama2c (jaidhyani)
1225d93 replace DataLoader (jaidhyani)
a9a791b run_dir to gigaconfig; output_run_dir; fix Generator type warning (jaidhyani)
10b1a36 save results when training is done (jaidhyani)
fbfeaa5 save step in results (jaidhyani)
5a54078 include architecture and priority in llama preset configs (jaidhyani)
19e779f Merge branch 'training-script' into mamba_dev (jaidhyani)
a98aa42 update training demo (jaidhyani)
53a6adf mamba expectedly imports correctly (jaidhyani)
0d69ede rm export_model (jaidhyani)
e24fec4 estimate_loss no longer depends on architecture (jaidhyani)
b9f682c add combine_configs (working towards frozen config for type safety) (jaidhyani)
13db6eb renaming/simplification (jaidhyani)
15983a3 model_config refactor to approach type safety + frozen dataclasses (jaidhyani)
ac8fb6a rm architectures.py (jaidhyani)
43dd1b2 new config system with type safety! (jaidhyani)
6a21f2c Support for optional config types (mamba and llama) (jaidhyani)
be2354f fix sample configs (jaidhyani)
c128f96 remove some unused model config args (jaidhyani)
28076ed remove unused mamba.py (jaidhyani)
384b140 I thought I already deleted this? (jaidhyani)
5f64802 rename to "initialize_model_training_state" (jaidhyani)
e4ecd21 Support for mandatory fields in run_training (jaidhyani)
a1a150d ModelTypes (jaidhyani)
ec04579 output_dir is output_dir (jaidhyani)
fb0c509 cleaner imports (jaidhyani)
129587d error if ModelConfig doesn't include config for chosen model type (jaidhyani)
ab208aa no-op renames for clarity (jaidhyani)
076cd8b log levels (jaidhyani)
be352fe shebang & chmod +x on run_training.py (jettjaniak)
10d718e renamed corpus dataset (jettjaniak)
77c15ef removed llama2c references from pyproject.toml (jettjaniak)
a8d03a8 removed .gitmodules (jettjaniak)
2d86063 removed scripts/upload_stories.py (jettjaniak)
bed480c test wandb_utils (jaidhyani)
f168310 no llama2c, no .view, no need for enforcing contigious tensors (jaidhyani)
6a67a02 Fix _unoptionalize (jaidhyani)
52745bc run_training.py --help when no args (jaidhyani)
9e759a3 script improvements: model-specific args moved to their own --help; f… (jaidhyani)
5dfdb94 rename llama to llama2 (jaidhyani)
12dc6c4 unused imports (jaidhyani)
a81f9e5 set run name from config file (jaidhyani)
63cb45b set default output_dir based on run_name (jaidhyani)
be3069d remove in-progress testing file added by mistake (jaidhyani)
d15f467 add huggingface config (jaidhyani)
9c27671 fix config json that got broken somehow (jaidhyani)
c259e97 save/load fix + huggingface uploading (jaidhyani)
0a04b99 fix test that broken when renaming llama to llama2 (jaidhyani)
083cb1b unused import (jaidhyani)
580d3c6 fix validation sampling (jaidhyani)
14dc55e remove eval_only (jaidhyani)
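Two of the config-related commits above name concrete behaviors: flag arguments take priority over config file values (96f2361), and configs can be updated with dotted "x.y.z = val" style keys (2ed386c). The sketch below is a hypothetical illustration of that merge logic, not the PR's actual code: `set_dotted` is an invented helper, and `combine_configs` only borrows its name from commit b9f682c; the repository's real config_utils may differ.

```python
from typing import Any


def set_dotted(config: dict[str, Any], dotted_key: str, value: Any) -> None:
    """Set config["x"]["y"]["z"] = value given the dotted key "x.y.z"."""
    *parents, leaf = dotted_key.split(".")
    node = config
    for key in parents:
        node = node.setdefault(key, {})  # create intermediate dicts as needed
    node[leaf] = value


def combine_configs(
    file_values: dict[str, Any], flag_values: dict[str, Any]
) -> dict[str, Any]:
    """Merge config-file values with CLI flag values; flags win on conflict."""
    merged: dict[str, Any] = {}
    for dotted_key, value in file_values.items():
        set_dotted(merged, dotted_key, value)
    for dotted_key, value in flag_values.items():  # applied last, so flags take priority
        set_dotted(merged, dotted_key, value)
    return merged


if __name__ == "__main__":
    merged = combine_configs(
        {"model.hidden_dim": 256, "train.lr": 1e-3},
        {"train.lr": 3e-4},  # flag overrides the file's train.lr
    )
    print(merged)  # {'model': {'hidden_dim': 256}, 'train': {'lr': 0.0003}}
```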
Viewing changes from commit fe834b03e72f588bef0203f045e45bf0a620b451: rename training_old -> training
File renamed without changes.
The main training function: given a GigaConfig, it performs setup and runs the training loop. Most of the actual logic lives in train_step.
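For orientation, here is a minimal, hypothetical sketch of the shape that comment describes: run_training takes a config, does setup (seeding torch before any other torch call, per commit 89cee7c), iterates train_step, and returns a ModelTrainingState (per commit cd9a5b1). Everything else here — the class fields, the toy model, the loss — is an illustrative stand-in, not the PR's actual implementation.

```python
from dataclasses import dataclass

import torch


@dataclass
class GigaConfigSketch:
    """Stand-in for the PR's GigaConfig; these field names are illustrative only."""
    max_steps: int = 100
    lr: float = 1e-3
    torch_seed: int = 42
    device: str = "cpu"


@dataclass
class ModelTrainingStateSketch:
    """Stand-in for ModelTrainingState, the value run_training returns."""
    model: torch.nn.Module
    optimizer: torch.optim.Optimizer
    step: int = 0


def train_step(state: ModelTrainingStateSketch, config: GigaConfigSketch) -> None:
    # Most of the actual logic lives here: forward pass, loss, backward, optimizer step.
    x = torch.randn(8, 4, device=config.device)
    loss = state.model(x).pow(2).mean()  # toy objective, purely for illustration
    state.optimizer.zero_grad()
    loss.backward()
    state.optimizer.step()


def run_training(config: GigaConfigSketch) -> ModelTrainingStateSketch:
    # Setup: seed torch first, then build the model/optimizer state.
    torch.manual_seed(config.torch_seed)
    model = torch.nn.Linear(4, 1).to(config.device)
    optimizer = torch.optim.AdamW(model.parameters(), lr=config.lr)
    state = ModelTrainingStateSketch(model=model, optimizer=optimizer)
    # The training loop itself just iterates train_step.
    for step in range(config.max_steps):
        state.step = step
        train_step(state, config)
    return state


if __name__ == "__main__":
    final_state = run_training(GigaConfigSketch())
    print(f"finished at step {final_state.step}")
```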