-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathconfig_vowels.yaml
18 lines (18 loc) · 1.01 KB
/
config_vowels.yaml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
smoke_test: false
rewrites:
dataset_name: "imdb_vowels" # This is used in a factory function to import the dataset template
scoring:
model: "armorm" # Choices: "distilbert_positive", "distilbert_negative", "armorm", "sfairxc", "ncsoft"
dataset_folder: "rewrites" # Choices: "rewrites", "scored"
dataset_filename: "imdb_vowels_dataset_20241118_123149.json"
dataset_name: "imdb_vowels" # Note: used in output filename so update to match the dataset_name below (INCLUDE CONCEPT)
effects:
dataset_name: "imdb_vowels" # Note: this is used to create the filename for the calculated effects
dataset_folder: "typos" # null to load directly from the scored dataset_folder. Or, specifiy a subdirectory
concept: "vowels"
score: "armorm"
w_original_key: "original"
w_counterfactual_key: "rewrite"
w_rewritten_rewrite_key: "rewritten rewrite"
reward_key: "NCSOFT/Llama-3-OffsetBias-RM-8B" # Note: This is the key for the reward in the dataset
dataset_filename: "imdb_vowels_30typos_complete_scored_20241120_162935.jsonl"