-
Notifications
You must be signed in to change notification settings - Fork 1
/
run.sh
72 lines (68 loc) · 2.09 KB
/
run.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
# NOTE: remember to change feature path in config.py if you change the feature
# Value passed to --method for every run launched by this script.
method='commit'

# R2R: launch src/main.py on the R2R dataset when the first argument is "R2R".
# "${1:-}" is quoted and defaulted so that invoking the script without an
# argument (or with one containing spaces) simply skips this branch instead of
# making `[` fail with "unary operator expected".
if [ "${1:-}" = "R2R" ]; then
  echo "====R2R===="
  # Optional flags, currently disabled; add them to the command below if needed:
  #   --not_load_strict \
  #   --evaluate_first \
  python src/main.py --log \
    --method "$method" \
    --description 'R2R,MLM,CLIP,' \
    --mask_visited \
    --use_panorama \
    --use_directed \
    --OPE_layer_num 2 \
    --MAM_layer_num 4 \
    --CCM_layer_num 1 \
    --dataset 'R2R' \
    --model 'PRET' \
    --agent 'AgentPath' \
    --trainer 'TF_SF' \
    --text_backbone 'ALBEF' \
    --gpu '0' \
    --lr 0.00001 \
    --batch_size 8 \
    --dropout 0.5 \
    --lr_scheduler cosine \
    --iteration_num 100000 \
    --log_every 1000 \
    --loss_weight 0.2 \
    --max_step 15 \
    --load 'temp/log/commit/2024-02-27_21:50:24_pretrain,R2R,MLM,CLIP'
  # Alternative checkpoint directory (swap with the --load line above):
  #   --load 'log/commit/2024-03-01_15:03:33_R2R,MLM,CLIP'
fi
# RxR dataset: launch src/main.py on RxR when the first argument is "RxR".
# Notes from the original author:
#   - RxR requires more GPU memory and a longer max_step.
#   - Gradient checkpointing is used in the multilingual RoBERTa to save memory.
#   - RxR uses a higher loss_weight to follow the path.
# "${1:-}" is quoted and defaulted so that invoking the script without an
# argument (or with one containing spaces) simply skips this branch instead of
# making `[` fail with "unary operator expected".
if [ "${1:-}" = "RxR" ]; then
  echo "====RxR===="
  # Optional flag, currently disabled; add it to the command below if needed:
  #   --evaluate_first \
  # --not_load_strict is passed because some checkpoints do not contain the
  # CCM module.
  python src/main.py --log \
    --method "$method" \
    --description 'RxR,bs4,MLM,CLIP,' \
    --mask_visited \
    --use_panorama \
    --use_directed \
    --not_load_strict \
    --OPE_layer_num 2 \
    --MAM_layer_num 4 \
    --CCM_layer_num 1 \
    --dataset 'RxR' \
    --model 'PRET' \
    --agent 'AgentPath' \
    --trainer 'TF_SF' \
    --gpu '0' \
    --lr 0.00001 \
    --dropout 0.5 \
    --batch_size 4 \
    --lr_scheduler cosine \
    --iteration_num 200000 \
    --log_every 5000 \
    --loss_weight 0.4 \
    --max_step 20 \
    --load 'log/commit/2024-03-02_00:12:15_RxR,bs4,MLM,CLIP'
  # Change the --load directory path to load a different model, e.g.:
  #   --load 'log/commit/2023-10-08_17:28:11_pretrain, RxR'
fi