-
Notifications
You must be signed in to change notification settings - Fork 7
/
Copy pathsmiles_vocab_creator.py
42 lines (35 loc) · 1.25 KB
/
smiles_vocab_creator.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
#!/usr/bin/env python3
"""Export vocabulary of SMILESLanguage from .smi files in directory."""
import argparse
import os
from pytoda.smiles.smiles_language import SMILESLanguage
# define the parser arguments
parser = argparse.ArgumentParser()
parser.add_argument('smi_path', type=str, help='path to a folder with .smi files')
parser.add_argument(
'pretrained_path',
type=str,
help='path to a folder to store the language as text files.',
)
def create_smiles_language(smi_path: str, pretrained_path: str) -> None:
"""
Create a SMILESLanguage object and save it to disk.
Args:
smi_path (str): path to a folder containing .smi files.
pretrained_path (str): directory to store the language as text files.
"""
os.makedirs(pretrained_path, exist_ok=True)
smiles_language = SMILESLanguage()
smiles_language.add_smis(
[
os.path.join(smi_path, smi_filename)
for smi_filename in os.listdir(smi_path)
if smi_filename.endswith('.smi')
]
)
smiles_language.save_pretrained(pretrained_path)
if __name__ == '__main__':
# parse arguments
args = parser.parse_args()
# run the creation and export
create_smiles_language(args.smi_path, args.pretrained_path)