Files
rdkit/Code/GraphMol/ChemReactions/PreprocessRxn.cpp
Brian Kelley fa89438358 Dev/reaction enumeration (#1111)
* Adds C++ Enumeration Engine to the RDKit

* Adds Sanitization helpers, wrappers and tests

* Clang format

* Remove unused enumerationStateOnly flag

* Fixes docStrings to current API

* Adds doc strings

* Removes RGroupPosition, adds getPosition to EnumerationBase

* Fixes readability.

* Adds EnumerateLibraryBase::reset and getReaction

* Added getReagents method to EnumerateLibrary

* Make the tests have the same naming

* Need to save the initial state for resetting.

* Stupid case-insensitive file systems

* Moves ResetState to EnumerateLibraryBase

* Adds removeNonmatchingReagents helper

* Renames currentPosition to getPosition

* Adds Enumeration Toolkit tutorial

* Fixes Python3 serialization and enumerators

* Verified to run on python2 and 3

* Fixes integer issues on windows

* The number of enumerations should be unsigned.

* Adds deserialization constructor

* Moves boost_serialization to the end

* Deprecates Clone in favor of copy

* Update tests to use copy.copy not Clone

* Move RGROUPS and BBS into an EnumerationTypes namespace

* Make sure old pickles work

* Adds pickle for backwards compatibility

* Moves to uint64_t from size_t for public api

* Whups, accidentally used the binary archiver.

* Commits boost 1.55 serialization

* Makes serialization optional (can be turned off), like the Filter Catalog

* Fixes tests when serialization is not available. Adds more enumeration strategy tests

* Fixes a syntax error on some versions of python

* Fixes sanitizeRxn to actually make proper RGroup atoms

* Updates SanitizeRXN python API

* Updates Enumeration API to a parameter class - fixes reagent removal

* Adds a mess of tests

* Change stats to return a string.

* Exposes EvenPairSamplingStrategy Stats to python

* Fixes a crash bug in SanitizeRxn

* Adds better testing of the even pair sampling

* Fixes namespace

* One more try to fix gcc

* Enum classes are c++11 and a microsoft extension.

* Fix typo

* Fixes np.median for python3

* Fixes atom iterators

* Adds virtual tags to derived virtual functions (for clarity)

* Fixes size comparison issues

* Adds doc string

* Small cleanup (has no effect since flags aren’t used)

* fixes crash bug on windows

* get the tests working on windows

* Updates tutorial

* Adds Glare implementation to Contrib
2016-11-05 14:42:52 +01:00

106 lines
4.1 KiB
C++

//
// Copyright (c) 2016, Novartis Institutes for BioMedical Research Inc.
// All rights reserved.
//
// Redistribution and use in source and binary forms, with or without
// modification, are permitted provided that the following conditions are
// met:
//
// * Redistributions of source code must retain the above copyright
// notice, this list of conditions and the following disclaimer.
// * Redistributions in binary form must reproduce the above
// copyright notice, this list of conditions and the following
// disclaimer in the documentation and/or other materials provided
// with the distribution.
// * Neither the name of Novartis Institutes for BioMedical Research Inc.
// nor the names of its contributors may be used to endorse or promote
// products derived from this software without specific prior written
// permission.
//
// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
// "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
// LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
// A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
// OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
// SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
// LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
// DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
// THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
// (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
// OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
//
#include "PreprocessRxn.h"
#include "ReactionParser.h"
#include <GraphMol/SmilesParse/SmilesParse.h>
#include <RDGeneral/BoostStartInclude.h>
#include <boost/shared_ptr.hpp>
#include <boost/thread/once.hpp>
#include <RDGeneral/BoostEndInclude.h>
#include <GraphMol/FilterCatalog/FunctionalGroupHierarchy.h>
namespace RDKit {
// Convenience overload: preprocesses rxn using the flattened functional
// group hierarchy (requested with normalized == true) as the query set.
//
//   rxn      - reaction to preprocess; passed on by non-const reference
//   propName - forwarded unchanged to the queries-taking overload
//
// Returns whatever the overload taking an explicit query map returns.
bool preprocessReaction(ChemicalReaction &rxn, const std::string &propName) {
  const bool useNormalizedGroups = true;
  return preprocessReaction(
      rxn, GetFlattenedFunctionalGroupHierarchy(useNormalizedGroups),
      propName);
}
// Convenience overload that reports diagnostics: preprocesses rxn using the
// flattened functional group hierarchy (requested with normalized == true)
// as the query set.
//
//   rxn            - reaction to preprocess; passed on by non-const reference
//   numWarnings    - forwarded by reference to the full overload
//   numErrors      - forwarded by reference to the full overload
//   reactantLabels - forwarded by reference to the full overload
//   propName       - forwarded unchanged to the full overload
//
// Returns whatever the overload taking an explicit query map returns.
bool preprocessReaction(
    ChemicalReaction &rxn, unsigned int &numWarnings, unsigned int &numErrors,
    std::vector<std::vector<std::pair<unsigned int, std::string> > >
        &reactantLabels,
    const std::string &propName) {
  const bool useNormalizedGroups = true;
  return preprocessReaction(
      rxn, numWarnings, numErrors, reactantLabels,
      GetFlattenedFunctionalGroupHierarchy(useNormalizedGroups), propName);
}
// Convenience overload for callers that do not need the diagnostics:
// preprocesses rxn against the supplied queries and discards the warning
// count, error count and reactant labels produced along the way.
//
//   rxn      - reaction to preprocess; passed on by non-const reference
//   queries  - query molecules keyed by name, forwarded unchanged
//   propName - forwarded unchanged to the full overload
//
// Returns whatever the full overload returns.
bool preprocessReaction(ChemicalReaction &rxn,
                        const std::map<std::string, ROMOL_SPTR> &queries,
                        const std::string &propName) {
  // These are handed to the callee by non-const reference. Start them at
  // zero so that no indeterminate value can ever be read, regardless of
  // whether the callee resets them before use.
  unsigned int numWarnings = 0;
  unsigned int numErrors = 0;
  std::vector<std::vector<std::pair<unsigned int, std::string> > >
      reactantLabels;
  return preprocessReaction(rxn, numWarnings, numErrors, reactantLabels,
                            queries, propName);
}
// Full preprocessing entry point; the other overloads forward here.
//
// Steps, in order:
//   1. turn on the reaction's implicit-properties flag,
//   2. initialize the reactant matchers,
//   3. validate the reaction, passing numWarnings and numErrors through,
//   4. if validation succeeded, add the recursive queries to the reaction.
//
//   rxn            - reaction to preprocess (modified in place)
//   numWarnings    - passed by reference to rxn.validate()
//   numErrors      - passed by reference to rxn.validate()
//   reactantLabels - its address is handed to addRecursiveQueriesToReaction()
//                    (presumably filled in there; confirm against that
//                    function's documentation)
//   queries        - query molecules keyed by name
//   propName       - forwarded to addRecursiveQueriesToReaction()
//
// Returns true when validation succeeded and the queries were added, and
// false when validation failed (in which case no queries are added).
bool preprocessReaction(
    ChemicalReaction &rxn, unsigned int &numWarnings, unsigned int &numErrors,
    std::vector<std::vector<std::pair<unsigned int, std::string> > >
        &reactantLabels,
    const std::map<std::string, ROMOL_SPTR> &queries,
    const std::string &propName) {
  rxn.setImplicitPropertiesFlag(true);
  rxn.initReactantMatchers();

  // Bail out early: an invalid reaction gets no recursive queries.
  if (!rxn.validate(numWarnings, numErrors)) {
    return false;
  }

  addRecursiveQueriesToReaction(rxn, queries, propName, &reactantLabels);
  return true;
}
}