5.1. Single Low-energy 3D Structures
The script gen_3d_structs.py generates a single low-energy 3D structure for each molecule read from the specified input file and writes the resulting structure to the desired output file.
Synopsis
python gen_3d_structs.py [-h] -i <file> -o <file> [-t <int>] [-q]
Mandatory options
- -i <file>
Molecule input file
- -o <file>
3D structure output file
Other options
- -h, --help
Show help message and exit
- -t <int>
Max. allowed molecule processing time (default: 3600 sec)
- -q
Disable progress output (default: false)
Code
1import sys
2import argparse
3
4import CDPL.Chem as Chem
5import CDPL.ConfGen as ConfGen
6
7
# builds a low-energy 3D structure for the passed molecule with the help of
# an already configured ConfGen.StructureGenerator instance
def gen3DStructure(mol: Chem.Molecule, struct_gen: ConfGen.StructureGenerator) -> int:
    """Generate a single low-energy 3D structure for *mol*.

    The molecule is first passed to ConfGen.prepareForConformerGeneration()
    and then handed to struct_gen.generate(). Only if the generator reports
    ConfGen.ReturnCode.SUCCESS are the resulting coordinates transferred to
    the molecule via struct_gen.setCoordinates().

    Args:
        mol: The molecule to process (modified in place).
        struct_gen: The initialized structure generator to use.

    Returns:
        The status code returned by struct_gen.generate().
    """
    # bring the molecule into the state required by the generator
    ConfGen.prepareForConformerGeneration(mol)

    # run the actual 3D structure generation
    result = struct_gen.generate(mol)

    # on failure there are no coordinates to transfer -> just report the code
    if result != ConfGen.ReturnCode.SUCCESS:
        return result

    # success: store the generated 3D coordinates in the molecule
    struct_gen.setCoordinates(mol)

    return result
24
def parseArgs(argv=None) -> argparse.Namespace:
    """Parse the command line arguments of the script.

    Args:
        argv: Optional sequence of argument strings to parse. If None
            (the default), argparse falls back to sys.argv[1:].

    Returns:
        A namespace with the attributes in_file (str), out_file (str),
        max_time (int, default 3600) and quiet (bool, default False).

    Raises:
        SystemExit: Raised by argparse on invalid/missing arguments or
            when -h/--help is given.
    """
    parser = argparse.ArgumentParser(description='Generates low energy 3D structures of the given input molecules.')

    parser.add_argument('-i',
                        dest='in_file',
                        required=True,
                        metavar='<file>',
                        help='Molecule input file')
    # the script writes a single 3D structure per molecule, not an ensemble
    parser.add_argument('-o',
                        dest='out_file',
                        required=True,
                        metavar='<file>',
                        help='3D structure output file')
    parser.add_argument('-t',
                        dest='max_time',
                        required=False,
                        metavar='<int>',
                        type=int,
                        default=3600,
                        help='Max. allowed molecule processing time (default: 3600 sec)')
    parser.add_argument('-q',
                        dest='quiet',
                        required=False,
                        action='store_true',
                        default=False,
                        help='Disable progress output (default: false)')

    return parser.parse_args(argv)
53
def main() -> None:
    """Script entry point: read molecules, generate 3D structures, write them.

    Each molecule read from the input file is passed to gen3DStructure().
    Molecules for which generation does not report SUCCESS are reported and
    skipped; read errors, write errors and exceptions terminate the script
    via sys.exit() with an error message. The writer is closed on every
    exit path. On normal completion the script exits with status 0.
    """
    args = parseArgs()

    # create reader for input molecules (format specified by file extension)
    reader = Chem.MoleculeReader(args.in_file)

    # create writer for the generated 3D structures (format specified by file extension)
    writer = Chem.MolecularGraphWriter(args.out_file)

    # the finally clause makes sure the writer also gets closed when the
    # script terminates early via sys.exit() on one of the error paths
    try:
        # export only a single 3D structure (in case of multi-conf. input molecules)
        Chem.setMultiConfExportParameter(writer, False)

        # create and initialize an instance of the class ConfGen.StructureGenerator which will
        # perform the actual 3D structure generation work
        struct_gen = ConfGen.StructureGenerator()

        # apply the -t argument (given in seconds; scaled by 1000,
        # presumably because the setting expects milliseconds)
        struct_gen.settings.timeout = args.max_time * 1000

        # dictionary mapping status codes to human readable strings
        status_to_str = {
            ConfGen.ReturnCode.UNINITIALIZED: 'uninitialized',
            ConfGen.ReturnCode.TIMEOUT: 'max. processing time exceeded',
            ConfGen.ReturnCode.ABORTED: 'aborted',
            ConfGen.ReturnCode.FORCEFIELD_SETUP_FAILED: 'force field setup failed',
            ConfGen.ReturnCode.FORCEFIELD_MINIMIZATION_FAILED: 'force field structure refinement failed',
            ConfGen.ReturnCode.FRAGMENT_LIBRARY_NOT_SET: 'fragment library not available',
            ConfGen.ReturnCode.FRAGMENT_CONF_GEN_FAILED: 'fragment conformer generation failed',
            ConfGen.ReturnCode.FRAGMENT_CONF_GEN_TIMEOUT: 'fragment conformer generation timeout',
            ConfGen.ReturnCode.FRAGMENT_ALREADY_PROCESSED: 'fragment already processed',
            ConfGen.ReturnCode.TORSION_DRIVING_FAILED: 'torsion driving failed',
            ConfGen.ReturnCode.CONF_GEN_FAILED: 'conformer generation failed',
        }

        # create an instance of the default implementation of the Chem.Molecule interface
        mol = Chem.BasicMolecule()
        i = 1

        # read and process molecules one after the other until the end of input has been reached
        try:
            while reader.read(mol):
                # compose a simple molecule identifier
                mol_id = Chem.getName(mol).strip()

                if mol_id == '':
                    mol_id = '#' + str(i)  # fallback if name is empty
                else:
                    mol_id = '\'%s\' (#%s)' % (mol_id, str(i))

                if not args.quiet:
                    print('- Generating 3D structure of molecule %s...' % mol_id)

                try:
                    # generate 3D structure of the read molecule
                    status = gen3DStructure(mol, struct_gen)

                    # check for severe error reported by status code
                    if status != ConfGen.ReturnCode.SUCCESS:
                        # status codes missing in the table must not trigger a
                        # KeyError that hides the actual failure reason
                        reason = status_to_str.get(status, 'unknown error (status code %s)' % str(status))

                        if args.quiet:
                            print('Error: 3D structure generation for molecule %s failed: %s' % (mol_id, reason))
                        else:
                            print(' -> 3D structure generation failed: %s' % reason)
                    else:
                        # enforce the output of 3D coordinates in case of MDL file formats
                        Chem.setMDLDimensionality(mol, 3)

                        # output the generated 3D structure
                        if not writer.write(mol):
                            sys.exit('Error: writing 3D structure of molecule %s failed' % mol_id)

                except Exception as e:
                    sys.exit('Error: 3D structure generation or output for molecule %s failed: %s' % (mol_id, str(e)))

                i += 1

        except Exception as e:  # handle exception raised in case of severe read errors
            sys.exit('Error: reading molecule failed: ' + str(e))

    finally:
        writer.close()

    sys.exit(0)
131
# start processing only when the file is executed as a script
# (and not when it gets imported as a module)
if __name__ == '__main__':
    main()