Chemical Data Processing Library C++ API - Version 1.4.0
PatternBasedTautomerizationRule.hpp
Go to the documentation of this file.
1 /*
2  * PatternBasedTautomerizationRule.hpp
3  *
4  * This file is part of the Chemical Data Processing Toolkit
5  *
6  * Copyright (C) 2003 Thomas Seidel <thomas.seidel@univie.ac.at>
7  *
8  * This library is free software; you can redistribute it and/or
9  * modify it under the terms of the GNU Lesser General Public
10  * License as published by the Free Software Foundation; either
11  * version 2 of the License, or (at your option) any later version.
12  *
13  * This library is distributed in the hope that it will be useful,
14  * but WITHOUT ANY WARRANTY; without even the implied warranty of
15  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
16  * Lesser General Public License for more details.
17  *
18  * You should have received a copy of the GNU Lesser General Public License
19  * along with this library; see the file COPYING. If not, write to
20  * the Free Software Foundation, Inc., 59 Temple Place - Suite 330,
21  * Boston, MA 02111-1307, USA.
22  */
23 
29 #ifndef CDPL_CHEM_PATTERNBASEDTAUTOMERIZATIONRULE_HPP
30 #define CDPL_CHEM_PATTERNBASEDTAUTOMERIZATIONRULE_HPP
31 
32 #include <cstddef>
33 #include <vector>
34 #include <algorithm>
35 #include <iterator>
36 #include <memory>
37 #include <functional>
38 
39 #include "CDPL/Chem/APIPrefix.hpp"
43 #include "CDPL/Util/BitSet.hpp"
45 
46 
47 namespace CDPL
48 {
49 
50  namespace Chem
51  {
52 
63  {
64 
65  public:
67  typedef std::shared_ptr<PatternBasedTautomerizationRule> SharedPointer;
68 
74  {
75 
77  std::size_t atom1ID;
79  std::size_t atom2ID;
82  };
83 
88  PatternBasedTautomerizationRule(unsigned int rule_id);
89 
95 
102 
114  template <typename Iter>
115  void addTransformationPattern(const MolecularGraph::SharedPointer& molgraph, Iter bond_chgs_beg, Iter bond_chgs_end)
116  {
117  structPatterns.push_back(molgraph);
118  patternSubSearchList.push_back(SubstructureSearch::SharedPointer(new SubstructureSearch(*molgraph)));
119  patternBondChangeLists.resize(patternBondChangeLists.size() + 1);
120 
121  std::copy(bond_chgs_beg, bond_chgs_end, std::back_inserter(patternBondChangeLists.back()));
122  }
123 
130 
136 
141 
147  bool setup(MolecularGraph& parent_molgraph);
148 
153  unsigned int getID() const;
154 
160  bool generate(Molecule& tautomer);
161 
167 
168  private:
169  bool applyTransformation(Molecule& tautomer);
170 
171  Atom* getTautomerAtom(Molecule& tautomer, std::size_t ptn_atom_id, const AtomMapping& mapping) const;
172 
173  void freeBitSet(Util::BitSet* bset);
174 
175  void createMatchedBondMask(const BondMapping& mapping, Util::BitSet& bond_mask) const;
176 
177  typedef std::vector<BondOrderChange> BondOrderChangeList;
178  typedef std::vector<BondOrderChangeList> BondOrderChangeListArray;
179  typedef std::vector<MolecularGraph::SharedPointer> StructPatternList;
180  typedef std::vector<SubstructureSearch::SharedPointer> SubstructureSearchList;
181  typedef std::vector<Util::BitSet*> BitSetList;
183 
184  unsigned int ruleID;
185  StructPatternList structPatterns;
186  StructPatternList excludePatterns;
187  BondOrderChangeListArray patternBondChangeLists;
188  SubstructureSearchList patternSubSearchList;
189  SubstructureSearchList excludeSubSearchList;
190  const MolecularGraph* parentMolGraph;
191  std::size_t currPatternIdx;
192  std::size_t currMappingIdx;
193  Util::BitSet bondMask;
194  BitSetList excludeMatches;
195  BitSetCache bitSetCache;
196  };
197  } // namespace Chem
198 } // namespace CDPL
199 
200 #endif // CDPL_CHEM_PATTERNBASEDTAUTOMERIZATIONRULE_HPP
Declaration of type CDPL::Util::BitSet.
Definition of the preprocessor macro CDPL_CHEM_API.
#define CDPL_CHEM_API
Tells the compiler/linker which classes, functions and variables are part of the library API.
Definition of class CDPL::Chem::MolecularGraph.
Definition of class CDPL::Util::ObjectStack.
Definition of class CDPL::Chem::SubstructureSearch.
Definition of class CDPL::Chem::TautomerizationRule.
Data type for the storage and lookup of arbitrary atom to atom mappings.
Definition: AtomMapping.hpp:54
Abstract base class representing a chemical atom and its bonded neighborhood.
Definition: Atom.hpp:57
Data type for the storage and lookup of arbitrary bond to bond mappings.
Definition: BondMapping.hpp:54
Abstract base class for representations of a chemical structure as a graph of bonded atoms.
Definition: MolecularGraph.hpp:57
std::shared_ptr< MolecularGraph > SharedPointer
A reference-counted smart pointer [SHPTR] for dynamically allocated MolecularGraph instances.
Definition: MolecularGraph.hpp:63
Abstract base class representing a mutable molecular graph that owns its atoms and bonds.
Definition: Molecule.hpp:53
SMARTS-pattern-based implementation of a Chem::TautomerizationRule.
Definition: PatternBasedTautomerizationRule.hpp:63
PatternBasedTautomerizationRule(unsigned int rule_id)
Constructs the PatternBasedTautomerizationRule instance with the given rule identifier.
void addExcludePattern(const MolecularGraph::SharedPointer &molgraph)
Registers an exclude pattern: when this substructure is present in the parent molecular graph,...
void addExcludePatterns(const PatternBasedTautomerizationRule &rule)
Copies all exclude patterns of rule into this rule.
PatternBasedTautomerizationRule(const PatternBasedTautomerizationRule &rule)
Constructs a copy of the PatternBasedTautomerizationRule instance rule.
void addTransformationPattern(const MolecularGraph::SharedPointer &molgraph, Iter bond_chgs_beg, Iter bond_chgs_end)
Registers a new transformation pattern together with the associated bond-order changes.
Definition: PatternBasedTautomerizationRule.hpp:115
void clearExcludePatterns()
Removes all registered exclude patterns.
unsigned int getID() const
Returns the rule identifier supplied at construction.
bool setup(MolecularGraph &parent_molgraph)
Prepares the rule for tautomer enumeration on parent_molgraph.
std::shared_ptr< PatternBasedTautomerizationRule > SharedPointer
A reference-counted smart pointer [SHPTR] for dynamically allocated PatternBasedTautomerizationRule i...
Definition: PatternBasedTautomerizationRule.hpp:67
TautomerizationRule::SharedPointer clone() const
Creates and returns a deep copy of this rule.
PatternBasedTautomerizationRule & operator=(const PatternBasedTautomerizationRule &rule)
Replaces the state of this rule by a copy of the state of rule.
bool generate(Molecule &tautomer)
Writes the next tautomer reachable from the parent molecular graph into tautomer.
Subgraph-isomorphism search of a query molecular graph against a target molecular graph,...
Definition: SubstructureSearch.hpp:74
std::shared_ptr< SubstructureSearch > SharedPointer
A reference-counted smart pointer [SHPTR] for dynamically allocated SubstructureSearch instances.
Definition: SubstructureSearch.hpp:86
Abstract base class for all tautomerization rule implementations used by the Chem::TautomerGenerator.
Definition: TautomerizationRule.hpp:50
std::shared_ptr< TautomerizationRule > SharedPointer
A reference-counted smart pointer [SHPTR] for dynamically allocated TautomerizationRule instances.
Definition: TautomerizationRule.hpp:54
boost::dynamic_bitset BitSet
Dynamic bitset class.
Definition: BitSet.hpp:46
The namespace of the Chemical Data Processing Library.
Encodes a single bond-order change between two pattern atoms applied when the parent transformation p...
Definition: PatternBasedTautomerizationRule.hpp:74
std::size_t atom1ID
Pattern-atom ID of the first atom of the bond whose order changes.
Definition: PatternBasedTautomerizationRule.hpp:77
std::size_t atom2ID
Pattern-atom ID of the second atom of the bond whose order changes.
Definition: PatternBasedTautomerizationRule.hpp:79
long orderChange
Signed bond-order delta applied to the matched bond (positive = increase, negative = decrease).
Definition: PatternBasedTautomerizationRule.hpp:81