14#include <boost/function.hpp>
23#include <boost/dynamic_bitset.hpp>
58 std::vector<int> reqElements = {},
59 std::string connSmarts =
"");
87 const ROMol &mol,
const std::vector<SubstructTerm> &terms =
106 const ROMol &mol,
const std::vector<SubstructTerm> &terms,
107 const std::vector<size_t> &relevantIndices);
131 return [relevantIndices](
const ROMol &taut) {
151 Tautomer() : d_numModifiedAtoms(0), d_numModifiedBonds(0), d_done(false) {}
155 d_numModifiedAtoms(a),
156 d_numModifiedBonds(b),
162 d_numModifiedAtoms(a),
163 d_numModifiedBonds(b),
178 size_t d_numModifiedAtoms;
179 size_t d_numModifiedBonds;
204 return (d_it == other.d_it);
207 return !(*
this == other);
229 SmilesTautomerMap::const_iterator d_it;
233 : d_tautomers(other.d_tautomers),
234 d_status(other.d_status),
235 d_modifiedAtoms(other.d_modifiedAtoms),
236 d_modifiedBonds(other.d_modifiedBonds) {
237 fillTautomersItVec();
243 size_t size()
const {
return d_tautomers.size(); }
244 bool empty()
const {
return d_tautomers.empty(); }
246 PRECONDITION(pos < d_tautomers.size(),
"index out of bounds");
247 return d_tautomersItVec.at(pos)->second.tautomer;
251 return d_modifiedAtoms;
254 return d_modifiedBonds;
258 std::vector<ROMOL_SPTR> tautomerVec;
259 tautomerVec.reserve(d_tautomers.size());
261 d_tautomers.begin(), d_tautomers.end(), std::back_inserter(tautomerVec),
266 std::vector<std::string>
smiles()
const {
267 std::vector<std::string> smilesVec;
268 smilesVec.reserve(d_tautomers.size());
269 std::transform(d_tautomers.begin(), d_tautomers.end(),
270 std::back_inserter(smilesVec),
277 void fillTautomersItVec() {
278 for (
auto it = d_tautomers.begin(); it != d_tautomers.end(); ++it) {
279 d_tautomersItVec.push_back(it);
283 SmilesTautomerMap d_tautomers;
286 std::vector<SmilesTautomerMap::const_iterator> d_tautomersItVec;
289 TautomerEnumeratorStatus d_status;
291 boost::dynamic_bitset<> d_modifiedAtoms;
293 boost::dynamic_bitset<> d_modifiedBonds;
306 : dp_catalog(tautCat),
307 d_maxTautomers(1000),
308 d_maxTransforms(1000),
309 d_removeSp3Stereo(true),
310 d_removeBondStereo(true),
311 d_removeIsotopicHs(true),
312 d_reassignStereo(true) {}
315 : dp_catalog(other.dp_catalog),
316 d_callback(other.d_callback),
317 d_maxTautomers(other.d_maxTautomers),
318 d_maxTransforms(other.d_maxTransforms),
319 d_removeSp3Stereo(other.d_removeSp3Stereo),
320 d_removeBondStereo(other.d_removeBondStereo),
321 d_removeIsotopicHs(other.d_removeIsotopicHs),
322 d_reassignStereo(other.d_reassignStereo) {}
324 if (
this == &other) {
327 dp_catalog = other.dp_catalog;
328 d_callback = other.d_callback;
329 d_maxTautomers = other.d_maxTautomers;
330 d_maxTransforms = other.d_maxTransforms;
331 d_removeSp3Stereo = other.d_removeSp3Stereo;
332 d_removeBondStereo = other.d_removeBondStereo;
333 d_removeIsotopicHs = other.d_removeIsotopicHs;
334 d_reassignStereo = other.d_reassignStereo;
339 d_maxTautomers = maxTautomers;
349 d_maxTransforms = maxTransforms;
361 d_removeSp3Stereo = removeSp3Stereo;
375 d_removeBondStereo = removeBondStereo;
385 d_removeIsotopicHs = removeIsotopicHs;
396 d_reassignStereo = reassignStereo;
408 d_callback.reset(callback);
438 "please use the form returning a TautomerEnumeratorResult "
439 "instead")]] std::vector<ROMOL_SPTR>
441 boost::dynamic_bitset<> *modifiedBonds =
nullptr)
const;
445 boost::function<
int(
const ROMol &mol)> scoreFunc =
452 template <
class Iterable,
453 typename std::enable_if<
454 !std::is_same<Iterable, TautomerEnumeratorResult>::value,
457 boost::function<
int(
const ROMol &mol)> scoreFunc =
460 if (tautomers.size() == 1) {
461 bestMol = *tautomers.begin();
464 int bestScore = std::numeric_limits<int>::min();
465 std::string bestSmiles =
"";
466 for (
const auto &t : tautomers) {
467 auto score = scoreFunc(*t);
468#ifdef VERBOSE_ENUMERATION
469 std::cerr <<
" " <<
MolToSmiles(*t) <<
" " << score << std::endl;
471 if (score > bestScore) {
475 }
else if (score == bestScore) {
477 if (smiles < bestSmiles) {
485 static const bool cleanIt =
true;
486 static const bool force =
true;
509 boost::function<
int(
const ROMol &mol)> scoreFunc = {})
const;
511 RWMol &mol, boost::function<
int(
const ROMol &mol)> scoreFunc = {})
const;
514 bool setTautomerStereoAndIsoHs(
const ROMol &mol,
ROMol &taut,
516 std::shared_ptr<TautomerCatalog> dp_catalog;
517 std::shared_ptr<TautomerEnumeratorCallback> d_callback;
518 unsigned int d_maxTautomers;
519 unsigned int d_maxTransforms;
520 bool d_removeSp3Stereo;
521 bool d_removeBondStereo;
522 bool d_removeIsotopicHs;
523 bool d_reassignStereo;
#define PRECONDITION(expr, mess)
Defines the CleanupParameters and some convenience functions.
virtual bool operator()(const ROMol &, const TautomerEnumeratorResult &)=0
virtual ~TautomerEnumeratorCallback()
TautomerEnumeratorCallback()
const_iterator & operator++()
const_iterator operator--(int)
const ROMOL_SPTR & reference
pointer operator->() const
std::ptrdiff_t difference_type
std::bidirectional_iterator_tag iterator_category
reference operator*() const
bool operator!=(const const_iterator &other) const
const_iterator operator++(int)
bool operator==(const const_iterator &other) const
const_iterator(const SmilesTautomerMap::const_iterator &it)
const_iterator & operator--()
Contains results of tautomer enumeration.
friend class TautomerEnumerator
const SmilesTautomerMap & smilesTautomerMap() const
const boost::dynamic_bitset & modifiedBonds() const
TautomerEnumeratorResult()
const boost::dynamic_bitset & modifiedAtoms() const
const const_iterator end() const
const const_iterator begin() const
const ROMOL_SPTR & operator[](size_t pos) const
std::vector< ROMOL_SPTR > tautomers() const
TautomerEnumeratorResult(const TautomerEnumeratorResult &other)
std::vector< ROMOL_SPTR > operator()() const
const ROMOL_SPTR & at(size_t pos) const
std::vector< std::string > smiles() const
TautomerEnumeratorStatus status() const
void setRemoveSp3Stereo(bool removeSp3Stereo)
TautomerEnumerator(const CleanupParameters ¶ms=CleanupParameters())
bool getRemoveBondStereo()
void setRemoveIsotopicHs(bool removeIsotopicHs)
bool getRemoveSp3Stereo()
unsigned int getMaxTransforms()
std::vector< ROMOL_SPTR > enumerate(const ROMol &mol, boost::dynamic_bitset<> *modifiedAtoms, boost::dynamic_bitset<> *modifiedBonds=nullptr) const
ROMol * pickCanonical(const TautomerEnumeratorResult &tautRes, boost::function< int(const ROMol &mol)> scoreFunc=TautomerScoringFunctions::scoreTautomer) const
returns the canonical tautomer from a TautomerEnumeratorResult
TautomerEnumeratorCallback * getCallback() const
bool getRemoveIsotopicHs()
TautomerEnumerator(TautomerCatalog *tautCat)
void setReassignStereo(bool reassignStereo)
void setRemoveBondStereo(bool removeBondStereo)
TautomerEnumeratorResult enumerate(const ROMol &mol) const
returns a TautomerEnumeratorResult structure for the input molecule
TautomerEnumerator & operator=(const TautomerEnumerator &other)
unsigned int getMaxTautomers()
void canonicalizeInPlace(RWMol &mol, boost::function< int(const ROMol &mol)> scoreFunc={}) const
void setCallback(TautomerEnumeratorCallback *callback)
ROMol * canonicalize(const ROMol &mol, boost::function< int(const ROMol &mol)> scoreFunc={}) const
returns the canonical tautomer for a molecule
TautomerEnumerator(const TautomerEnumerator &other)
void setMaxTransforms(unsigned int maxTransforms)
void setMaxTautomers(unsigned int maxTautomers)
ROMol * pickCanonical(const Iterable &tautomers, boost::function< int(const ROMol &mol)> scoreFunc=TautomerScoringFunctions::scoreTautomer) const
Tautomer(ROMOL_SPTR t, ROMOL_SPTR k, size_t a=0, size_t b=0)
friend class TautomerEnumerator
Tautomer(ROMOL_SPTR t, size_t a=0, size_t b=0)
const ROMOL_SPTR & getKekulized() const
RWMol is a molecule class that is intended to be edited.
#define RDKIT_MOLSTANDARDIZE_EXPORT
RDKIT_GRAPHMOL_EXPORT void assignStereochemistry(ROMol &mol, bool cleanIt=false, bool force=false, bool flagPossibleStereoCenters=false)
Assign stereochemistry tags to atoms and bonds.
RDKIT_GRAPHMOL_EXPORT void Kekulize(RWMol &mol, bool markAtomsBonds=true, bool canonical=true, unsigned int maxBackTracks=100)
Kekulizes the molecule.
RDKIT_MOLSTANDARDIZE_EXPORT int scoreHeteroHs(const ROMol &mol)
RDKIT_MOLSTANDARDIZE_EXPORT std::vector< size_t > getRelevantSubstructTermIndices(const ROMol &mol, const std::vector< SubstructTerm > &terms=getDefaultTautomerScoreSubstructs())
RDKIT_MOLSTANDARDIZE_EXPORT int scoreSubstructsFiltered(const ROMol &mol, const std::vector< SubstructTerm > &terms, const std::vector< size_t > &relevantIndices)
int scoreTautomer(const ROMol &mol)
const std::string tautomerScoringVersion
RDKIT_MOLSTANDARDIZE_EXPORT const std::vector< SubstructTerm > & getDefaultTautomerScoreSubstructs()
RDKIT_MOLSTANDARDIZE_EXPORT int scoreRings(const ROMol &mol)
RDKIT_MOLSTANDARDIZE_EXPORT int scoreSubstructs(const ROMol &mol, const std::vector< SubstructTerm > &terms=getDefaultTautomerScoreSubstructs())
scoreSubstructs scores the molecule based on the substructure definitions
boost::function< int(const ROMol &)> makeOptimizedScorer(const ROMol &mol)
RDKIT_MOLSTANDARDIZE_EXPORT const TautomerTransformDefs defaultTautomerTransformsv1
std::map< std::string, Tautomer > SmilesTautomerMap
TautomerEnumerator * tautomerEnumeratorFromParams(const CleanupParameters ¶ms)
TautomerEnumerator * getV1TautomerEnumerator()
RDCatalog::HierarchCatalog< TautomerCatalogEntry, TautomerCatalogParams, int > TautomerCatalog
std::pair< std::string, Tautomer > SmilesTautomerPair
RDKIT_SMILESPARSE_EXPORT std::string MolToSmiles(const ROMol &mol, const SmilesWriteParams ¶ms)
returns canonical SMILES for a molecule
boost::shared_ptr< ROMol > ROMOL_SPTR
SubstructTerm(const SubstructTerm &rhs)=default
RWMol connectivityMatcher
std::string connectivitySmarts
SubstructTerm(std::string aname, std::string asmarts, int ascore, std::vector< int > reqElements={}, std::string connSmarts="")
bool operator==(const SubstructTerm &rhs) const
std::vector< int > requiredElements