-
Notifications
You must be signed in to change notification settings - Fork 3
/
Copy pathconfig.py
65 lines (62 loc) · 2.42 KB
/
config.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
# Seed constant for random number generation. The code that consumes it is
# not visible in this file -- presumably shared so that runs are
# reproducible (TODO confirm against callers).
RANDOM_SEED = 0
# Dataset file locations, keyed first by language name and then by split
# name ('train', 'dev', 'test'). Every value is a relative path to a .tsv
# file under data/subtask-1a--<language>/.
DATASET_PATHS = {
    # English: train/dev live in normalized/, test in the language root.
    'english': {
        'train': 'data/subtask-1a--english/normalized/dataset_train.tsv',
        'dev': 'data/subtask-1a--english/normalized/dataset_dev.tsv',
        'test': 'data/subtask-1a--english/dataset_test_input_english.tsv',
    },
    # Turkish: train/dev live in normalized/, test in the language root.
    'turkish': {
        'train': 'data/subtask-1a--turkish/normalized/dataset_train_v1_turkish.tsv',
        'dev': 'data/subtask-1a--turkish/normalized/dataset_dev_v1_turkish.tsv',
        'test': 'data/subtask-1a--turkish/dataset_test_v1_turkish.tsv',
    },
    # Spanish: train/dev live in normalized/, test in the language root.
    'spanish': {
        'train': 'data/subtask-1a--spanish/normalized/dataset_train.tsv',
        'dev': 'data/subtask-1a--spanish/normalized/dataset_dev.tsv',
        'test': 'data/subtask-1a--spanish/dataset_test_participants.tsv',
    },
    # Bulgarian: unlike the other languages, train/dev are NOT taken from a
    # normalized/ subdirectory; all three files sit in the language root.
    'bulgarian': {
        'train': 'data/subtask-1a--bulgarian/dataset_train_v1_bulgarian.tsv',
        'dev': 'data/subtask-1a--bulgarian/dataset_dev_v1_bulgarian.tsv',
        'test': 'data/subtask-1a--bulgarian/dataset_test_input_bulgarian.tsv',
    },
    # Arabic: train/dev live in normalized/, test in the language root.
    'arabic': {
        'train': 'data/subtask-1a--arabic/normalized/train.tsv',
        'dev': 'data/subtask-1a--arabic/normalized/dev.tsv',
        'test': 'data/subtask-1a--arabic/CT21-AR-Test-T1.tsv',
    },
}
# Cross-validation variant of the dataset locations, keyed by language name
# and then by split name. For every language the 'train' entry is
# data/subtask-1a--<language>/folds (no file extension -- presumably a
# directory of fold files; confirm against the loader), while the 'dev' and
# 'test' entries are the same .tsv paths listed in DATASET_PATHS.
CV_DATASET_PATHS = {
    'english': {
        'train': 'data/subtask-1a--english/folds',
        'dev': 'data/subtask-1a--english/normalized/dataset_dev.tsv',
        'test': 'data/subtask-1a--english/dataset_test_input_english.tsv',
    },
    'turkish': {
        'train': 'data/subtask-1a--turkish/folds',
        'dev': 'data/subtask-1a--turkish/normalized/dataset_dev_v1_turkish.tsv',
        'test': 'data/subtask-1a--turkish/dataset_test_v1_turkish.tsv',
    },
    'spanish': {
        'train': 'data/subtask-1a--spanish/folds',
        'dev': 'data/subtask-1a--spanish/normalized/dataset_dev.tsv',
        'test': 'data/subtask-1a--spanish/dataset_test_participants.tsv',
    },
    # Bulgarian dev is read from the language root, not from normalized/.
    'bulgarian': {
        'train': 'data/subtask-1a--bulgarian/folds',
        'dev': 'data/subtask-1a--bulgarian/dataset_dev_v1_bulgarian.tsv',
        'test': 'data/subtask-1a--bulgarian/dataset_test_input_bulgarian.tsv',
    },
    'arabic': {
        'train': 'data/subtask-1a--arabic/folds',
        'dev': 'data/subtask-1a--arabic/normalized/dev.tsv',
        'test': 'data/subtask-1a--arabic/CT21-AR-Test-T1.tsv',
    },
}
# Integer id for each language name. Ids are consecutive, start at 0 and
# follow the position of the language in the tuple below, so the tuple
# order is significant and must not be rearranged.
LANGS_IDS = {
    language: index
    for index, language in enumerate(
        ('english', 'turkish', 'spanish', 'bulgarian', 'arabic')
    )
}