mirror of
https://github.com/rdkit/rdkit.git
synced 2026-06-04 21:54:27 +08:00
* do not use new on loggers * del pointers in testDistGeom * Update Dict hasNonPOD status on bulk update * delete new Dicts in memtest1.cpp * fixes in MolSuppliers and testFMCS * PeriodicTable singleton as unique_ptr * fix EEM_arrays leak * fix leaks in testPBF * fix ParamCollection leak in test UFF * fix leaks in MMFF * clear prop dict before read in in pickler * fix leaks in testFreeSASA * fix leaks in test3D * modernize Dict.h & SmilesParse.cpp * fix leaks in testQuery * fix leaks in testCrystalFF * fix leaks in cxsmilesTest * fix leaks in Catalog & mol cat test * fix leaks in ShapeUtils & tests * fix leaks in testSubgraphs1 * fix leaks testFingerprintGenerators * fix leaks in Catalog/FilterCatalog * fix leaks in graphmolqueryTest * these changes reduce bison parse leaks * fixed leaks in testChirality.cpp * fix leaks + 2 tests in testMolWriter * fix 4m leaks in substructLibraryTest * small improvements to molTautomerTest; still leaks * fix leaks in testRGroupDecomp * fix leaks in test; parser still leaks * fix leaks in itertest * fix 4m leaks in testDepictor * fixes in smatest; still leaking due to parser * fixes in testSLNParse; still leaking due to parser * flex/bison: always add atoms with ownership; smarts error cleanup * fix leaks in testReaction * fix leaks in testSubstructMatch * fix leaks in resMolSupplierTest * fix leaks in testChemTransforms + bug in ChemTransforms * fix leaks in testPickler * fix leaks in testMolTransform * fix leaks in testFragCatalog * fix leak in testSLNParse. Still leaks due to Smiles * fixed most leaks in testMolSupplier * pre bison fix * fix some atom & bond parse problems; others still fail * bison smiles & smarts, atoms & bonds more or less fixed * fix leaks in molopstest.cpp * fix leaks in testFingerprints, MACCS.cpp & AtomPairs.cpp * fix leaks in moldraw2Dtest1 * fix leaks in testDescriptors * fix leaks in testInchi * fix leaks in testUFFForceFieldHelpers * fix leaks in hanoiTest & new_canon.h * fix leaks in testMMFFForceField * fix leaks in graphmolTest1 * fix leaks in testMMFFForceFieldHelpers * fix leaks in testDistGeomHelpers * fix leaks in testMolAlign * initialize occupancy & temp facto with default values * fix leak in TautomerTransform * updated suppressions * fix testStructChecker * fix logging & py tests * fix TautomerTransform class/struct issue * remove misplaced delete in testSLNParse * deinit in testAvalonLib1 * fix Avalon-triggered(?) bug in StructChecker/Pattern.cpp * fix random testMolWriter/Supplier fails - diversify output file names to avoid clashing. - unify Writers close/destruct behavior. - flushing/closing in tests. * use reset in FFs Params.cpp * comments on testMMFFForceField * unrequired 'if's added to mol suppliers * correct cast in FilterCatalog.h * use unique_ptr in MACCS Patterns * remove unrequred if in new_canon * update & move suppressions
187 lines
6.3 KiB
C++
187 lines
6.3 KiB
C++
// $Id$
|
|
//
|
|
// Copyright (c) 2007-2014, Novartis Institutes for BioMedical Research Inc.
|
|
// All rights reserved.
|
|
//
|
|
// Redistribution and use in source and binary forms, with or without
|
|
// modification, are permitted provided that the following conditions are
|
|
// met:
|
|
//
|
|
// * Redistributions of source code must retain the above copyright
|
|
// notice, this list of conditions and the following disclaimer.
|
|
// * Redistributions in binary form must reproduce the above
|
|
// copyright notice, this list of conditions and the following
|
|
// disclaimer in the documentation and/or other materials provided
|
|
// with the distribution.
|
|
// * Neither the name of Novartis Institutes for BioMedical Research Inc.
|
|
// nor the names of its contributors may be used to endorse or promote
|
|
// products derived from this software without specific prior written
|
|
// permission.
|
|
//
|
|
// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
|
|
// "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
|
|
// LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
|
|
// A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
|
|
// OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
|
|
// SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
|
|
// LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
|
|
// DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
|
|
// THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
|
|
// (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
|
|
// OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
|
//
|
|
|
|
#include <GraphMol/ChemReactions/Reaction.h>
|
|
#include <GraphMol/ChemReactions/ReactionParser.h>
|
|
#include <GraphMol/SmilesParse/SmilesParse.h>
|
|
|
|
#include <boost/algorithm/string.hpp>
|
|
#include <vector>
|
|
#include <string>
|
|
#include "ReactionUtils.h"
|
|
|
|
namespace RDKit {
|
|
namespace DaylightParserUtils {
|
|
std::vector<std::string> splitSmartsIntoComponents(
|
|
const std::string &reactText) {
|
|
std::vector<std::string> res;
|
|
unsigned int pos = 0;
|
|
unsigned int blockStart = 0;
|
|
unsigned int level = 0;
|
|
unsigned int inBlock = 0;
|
|
while (pos < reactText.size()) {
|
|
if (reactText[pos] == '(') {
|
|
if (pos == blockStart) {
|
|
inBlock = 1;
|
|
}
|
|
++level;
|
|
} else if (reactText[pos] == ')') {
|
|
if (level == 1 && inBlock) {
|
|
// this closes a block
|
|
inBlock = 2;
|
|
}
|
|
--level;
|
|
} else if (level == 0 && reactText[pos] == '.') {
|
|
if (inBlock == 2) {
|
|
std::string element =
|
|
reactText.substr(blockStart + 1, pos - blockStart - 2);
|
|
res.push_back(element);
|
|
} else {
|
|
std::string element = reactText.substr(blockStart, pos - blockStart);
|
|
res.push_back(element);
|
|
}
|
|
blockStart = pos + 1;
|
|
inBlock = 0;
|
|
}
|
|
++pos;
|
|
}
|
|
if (blockStart < pos) {
|
|
if (inBlock == 2) {
|
|
std::string element =
|
|
reactText.substr(blockStart + 1, pos - blockStart - 2);
|
|
res.push_back(element);
|
|
} else {
|
|
std::string element = reactText.substr(blockStart, pos - blockStart);
|
|
res.push_back(element);
|
|
}
|
|
}
|
|
return res;
|
|
}
|
|
|
|
ROMol *constructMolFromString(const std::string &txt,
|
|
std::map<std::string, std::string> *replacements,
|
|
bool useSmiles) {
|
|
ROMol *mol;
|
|
if (!useSmiles) {
|
|
mol = SmartsToMol(txt, 0, false, replacements);
|
|
} else {
|
|
mol = SmilesToMol(txt, 0, false, replacements);
|
|
}
|
|
return mol;
|
|
}
|
|
|
|
} // end of namespace DaylightParserUtils
|
|
|
|
ChemicalReaction *RxnSmartsToChemicalReaction(
|
|
const std::string &text, std::map<std::string, std::string> *replacements,
|
|
bool useSmiles) {
|
|
std::size_t pos1 = text.find('>');
|
|
std::size_t pos2 = text.rfind('>');
|
|
if (pos1 == std::string::npos) {
|
|
throw ChemicalReactionParserException(
|
|
"a reaction requires at least one reactant and one product");
|
|
}
|
|
if (text.find('>', pos1 + 1) != pos2) {
|
|
throw ChemicalReactionParserException("multi-step reactions not supported");
|
|
}
|
|
|
|
std::string reactText = text.substr(0, pos1);
|
|
std::string agentText;
|
|
if (pos2 != pos1 + 1) {
|
|
agentText = text.substr(pos1 + 1, (pos2 - pos1) - 1);
|
|
}
|
|
std::string productText = text.substr(pos2 + 1);
|
|
|
|
// recognize changes within the same molecules, e.g., intra molecular bond
|
|
// formation
|
|
// therefore we need to correctly interpret parenthesis and dots in the
|
|
// reaction smarts
|
|
std::vector<std::string> reactSmarts =
|
|
DaylightParserUtils::splitSmartsIntoComponents(reactText);
|
|
std::vector<std::string> productSmarts =
|
|
DaylightParserUtils::splitSmartsIntoComponents(productText);
|
|
|
|
auto *rxn = new ChemicalReaction();
|
|
|
|
for (const auto &txt : reactSmarts) {
|
|
ROMol *mol;
|
|
mol = DaylightParserUtils::constructMolFromString(txt, replacements,
|
|
useSmiles);
|
|
if (!mol) {
|
|
std::string errMsg = "Problems constructing reactant from SMARTS: ";
|
|
errMsg += txt;
|
|
delete rxn;
|
|
throw ChemicalReactionParserException(errMsg);
|
|
}
|
|
rxn->addReactantTemplate(ROMOL_SPTR(mol));
|
|
}
|
|
|
|
for (const auto &txt : productSmarts) {
|
|
ROMol *mol;
|
|
mol = DaylightParserUtils::constructMolFromString(txt, replacements,
|
|
useSmiles);
|
|
if (!mol) {
|
|
std::string errMsg = "Problems constructing product from SMARTS: ";
|
|
errMsg += txt;
|
|
delete rxn;
|
|
throw ChemicalReactionParserException(errMsg);
|
|
}
|
|
rxn->addProductTemplate(ROMOL_SPTR(mol));
|
|
}
|
|
updateProductsStereochem(rxn);
|
|
|
|
ROMol *agentMol;
|
|
// allow a reaction template to have no agent specified
|
|
if (agentText.size() != 0) {
|
|
agentMol = DaylightParserUtils::constructMolFromString(
|
|
agentText, replacements, useSmiles);
|
|
if (!agentMol) {
|
|
std::string errMsg = "Problems constructing agent from SMARTS: ";
|
|
errMsg += agentText;
|
|
delete rxn;
|
|
throw ChemicalReactionParserException(errMsg);
|
|
}
|
|
std::vector<ROMOL_SPTR> agents = MolOps::getMolFrags(*agentMol, false);
|
|
delete agentMol;
|
|
for (auto &agent : agents) {
|
|
rxn->addAgentTemplate(agent);
|
|
}
|
|
}
|
|
|
|
// "SMARTS"-based reactions have implicit properties
|
|
rxn->setImplicitPropertiesFlag(true);
|
|
|
|
return rxn;
|
|
}
|
|
}
|