-
Notifications
You must be signed in to change notification settings - Fork 3
/
Copy pathlemmatization-config.py
33 lines (29 loc) · 1.01 KB
/
lemmatization-config.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
# --- Corpus splits -----------------------------------------------------------
# CoNLL-U files of the UD Ancient Greek (Perseus) treebank, UD release v2.14.
# All paths are relative; presumably resolved against the working directory of
# the script that imports this module -- TODO confirm.
train_file = (
    "data/ud-treebanks-v2.14/UD_Ancient_Greek-Perseus/grc_perseus-ud-train.conllu"
)
valid_file = (
    "data/ud-treebanks-v2.14/UD_Ancient_Greek-Perseus/grc_perseus-ud-dev.conllu"
)
test_file = (
    "data/ud-treebanks-v2.14/UD_Ancient_Greek-Perseus/grc_perseus-ud-test.conllu"
)

# --- Run artefacts -----------------------------------------------------------
# Destination of the log file for the lemmatization run.
log_file = "logs/lemmatization.log"
# Directory for model output (name suggests checkpoints; verify in the caller).
output_dir = "models/lemmatization"
# Hyperparameter sweep definition.
# NOTE(review): the method/parameters/metric layout looks like a Weights &
# Biases sweep config, and the parameter names resemble Hugging Face
# Seq2SeqTrainingArguments fields -- confirm against the consuming script.
sweep_config = {
    "method": "grid",
    "parameters": {
        # Swept entries use a "values" list. Each list currently holds a
        # single candidate, so the grid has exactly one combination.
        "learning_rate": {
            # 3e-5 and 5e-5 were left commented out as further candidates.
            "values": [1e-5],
        },
        "model_name_or_path": {
            "values": ["bowphs/GreTa"],
        },
        "num_train_epochs": {
            "values": [2],
        },
        "per_device_train_batch_size": {
            "values": [16],
        },
        "per_device_eval_batch_size": {
            "values": [16],
        },
        "weight_decay": {
            "values": [0.01],
        },
        # Fixed entries use a single "value" instead of a list.
        "run_name": {
            "value": "demorun",
        },
        "predict_with_generate": {
            "value": True,
        },
        "generation_max_length": {
            "value": 30,
        },
        "generation_num_beams": {
            "value": 20,
        },
    },
    # Objective for the sweep: maximize the "eval/exact_match" metric.
    "metric": {
        "name": "eval/exact_match",
        "goal": "maximize",
    },
}