Skip to content

Commit

Permalink
added example data pipeline TOML file
Browse files Browse the repository at this point in the history
  • Loading branch information
Löffler, Hannes committed Jul 10, 2024
1 parent 1875d40 commit e383f5e
Showing 1 changed file with 24 additions and 0 deletions.
24 changes: 24 additions & 0 deletions configs/toml/data_pipeline.toml
Original file line number Diff line number Diff line change
@@ -0,0 +1,24 @@
# Input example for the REINVENT4 data pipeline
#
# Root-table keys: input/output files and processing settings.
# NOTE(review): the per-key notes below are inferred from key names and values
# only; confirm them against the REINVENT4 data pipeline documentation.

# Input file; presumably a delimited text file with a header row - confirm.
input_csv_file = "test.csv"
# Presumably the name of the input column that holds the SMILES strings.
smiles_column = "SMILES"
# "\t" is the TOML basic-string escape for a single tab character, so the value
# is a tab even though the input file above carries a .csv extension.
separator = "\t"
# Presumably the file the processed SMILES are written to.
output_smiles_file = "processed.smi"
# Presumably the number of worker processes to use - confirm.
num_procs = 1
# Presumably the number of input records handled per chunk - confirm.
chunk_size = 500

# Settings grouped under the "filter" table.
# NOTE(review): the meaning of each key is inferred from its name; verify the
# exact semantics, units, and defaults against the REINVENT4 documentation.
[filter]
# Presumably the chemical element symbols a molecule may contain - confirm
# whether molecules with other elements are dropped.
elements = ["I", "O", "Cl", "N", "C", "F", "S", "Br"]
# Presumably the names of the transformations to apply - confirm valid names.
transforms = ["standard"]
# Presumably inclusive bounds on the heavy-atom count - confirm.
min_heavy_atoms = 2
max_heavy_atoms = 90
# Float value; units are not stated here (presumably g/mol or Da - confirm).
max_mol_weight = 1200.0
# Presumably the minimum number of carbon atoms required - confirm.
min_carbons = 2
# Presumably upper limits on ring count and on the size of any single ring.
max_num_rings = 12
max_ring_size = 7
# Presumably: keep stereochemistry information in the output SMILES - confirm.
keep_stereo = true
# Presumably: keep molecules that carry isotope labels - confirm.
keep_isotope_molecules = true
# Presumably: neutralize charged molecules - confirm.
uncharge = true
# Presumably: write SMILES in kekulized rather than aromatic form - confirm.
kekulize = false
# Presumably: emit randomized instead of canonical SMILES - confirm.
randomize_smiles = false
# Presumably: report per-molecule processing errors - confirm destination.
report_errors = false

0 comments on commit e383f5e

Please sign in to comment.