-
Notifications
You must be signed in to change notification settings - Fork 24
/
Copy pathcount_undefined_stereocenters.py
executable file
·34 lines (25 loc) · 1.32 KB
/
count_undefined_stereocenters.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
#!/usr/bin/env python3
__author__ = 'pavel'
import argparse
from gen_stereo_rdkit import get_unspec_double_bonds
from rdkit import Chem
from read_input import read_input
def main():
parser = argparse.ArgumentParser(description='Generation of stereoisomers with RDKit.')
parser.add_argument('-i', '--input', metavar='input.sdf', required=True,
help='input file in SDF or SMILES format. SMILES input should have no header, '
'the first column is SMILES string and the second column with ID is optional.')
parser.add_argument('--no_tetrahedral', required=False, action='store_true', default=False,
help='do not count stereoisomers for unspecified tetrahedral centers.')
parser.add_argument('--no_double_bond', required=False, action='store_true', default=False,
help='do not count stereoisomers for unspecified double bonds.')
args = parser.parse_args()
for mol, mol_name in read_input(args.input):
undef = 0
if not args.no_tetrahedral:
undef += sum(i[1] == '?' for i in Chem.FindMolChiralCenters(mol, includeUnassigned=True))
if not args.no_double_bond:
undef += len(get_unspec_double_bonds(mol))
print(f'{mol_name}\t{undef}')
if __name__ == '__main__':
main()