mirror of
https://github.com/rdkit/rdkit.git
synced 2026-06-05 22:04:27 +08:00
* copy in, get building, add some basic tests * complete the testing Except for regiosiomers, which do not work * regioisomers work now * backup commit; things work * remove last of NM macros from hashfunctions.cpp * remove last of NM macros from hashfunctions.cpp * remove dependency on the abstraction layer * typo * start using namespaces clang-format * switch to using enums for the HashFunctions and StripTypes * Add initial python wrapper (and tests) * move the new hashing code to the MolHash library still may want to revise the naming of this * Setup deprecation of the older hashing code * better release notes text * change in response to review
76 lines
3.1 KiB
C++
76 lines
3.1 KiB
C++
//
|
|
// Copyright (C) 2014 Novartis Institutes for BioMedical Research
|
|
//
|
|
// @@ All Rights Reserved @@
|
|
// This file is part of the RDKit.
|
|
// The contents are covered by the terms of the BSD license
|
|
// which is included in the file license.txt, found at the root
|
|
// of the RDKit source tree.
|
|
//
|
|
#include <RDBoost/python.h>
|
|
#include <GraphMol/ROMol.h>
|
|
#include <GraphMol/MolHash/MolHash.h>
|
|
#include <RDBoost/Wrap.h>
|
|
|
|
namespace python = boost::python;
|
|
using namespace RDKit;
|
|
|
|
namespace {
|
|
std::string GenMolHashString(const ROMol &mol, python::object atomsToUse,
|
|
python::object bondsToUse) {
|
|
std::unique_ptr<std::vector<unsigned>> avect;
|
|
if (atomsToUse) {
|
|
avect = pythonObjectToVect(atomsToUse,
|
|
static_cast<unsigned>(mol.getNumAtoms()));
|
|
}
|
|
std::unique_ptr<std::vector<unsigned>> bvect;
|
|
if (bondsToUse) {
|
|
bvect = pythonObjectToVect(bondsToUse,
|
|
static_cast<unsigned>(mol.getNumBonds()));
|
|
}
|
|
std::string res =
|
|
MolHash::generateMoleculeHashSet(mol, avect.get(), bvect.get());
|
|
return res;
|
|
}
|
|
|
|
std::string MolHashHelper(const ROMol &mol, MolHash::HashFunction func) {
|
|
RWMol cpy(mol);
|
|
return MolHash::MolHash(&cpy, func);
|
|
}
|
|
} // namespace
|
|
|
|
BOOST_PYTHON_MODULE(rdMolHash) {
|
|
python::scope().attr("__doc__") =
|
|
"Module containing functions to generate hashes for molecules";
|
|
|
|
python::enum_<MolHash::HashFunction>("HashFunction")
|
|
.value("AnonymousGraph", MolHash::HashFunction::AnonymousGraph)
|
|
.value("ElementGraph", MolHash::HashFunction::ElementGraph)
|
|
.value("CanonicalSmiles", MolHash::HashFunction::CanonicalSmiles)
|
|
.value("MurckoScaffold", MolHash::HashFunction::MurckoScaffold)
|
|
.value("ExtendedMurcko", MolHash::HashFunction::ExtendedMurcko)
|
|
.value("MolFormula", MolHash::HashFunction::MolFormula)
|
|
.value("AtomBondCounts", MolHash::HashFunction::AtomBondCounts)
|
|
.value("DegreeVector", MolHash::HashFunction::DegreeVector)
|
|
.value("Mesomer", MolHash::HashFunction::Mesomer)
|
|
.value("HetAtomTautomer", MolHash::HashFunction::HetAtomTautomer)
|
|
.value("HetAtomProtomer", MolHash::HashFunction::HetAtomProtomer)
|
|
.value("RedoxPair", MolHash::HashFunction::RedoxPair)
|
|
.value("Regioisomer", MolHash::HashFunction::Regioisomer)
|
|
.value("NetCharge", MolHash::HashFunction::NetCharge)
|
|
.value("SmallWorldIndexBR", MolHash::HashFunction::SmallWorldIndexBR)
|
|
.value("SmallWorldIndexBRL", MolHash::HashFunction::SmallWorldIndexBRL)
|
|
.value("ArthorSubstructureOrder",
|
|
MolHash::HashFunction::ArthorSubstructureOrder);
|
|
|
|
std::string docString = "DEPRECATED: please use MolHash() instead";
|
|
python::def("GenerateMoleculeHashString", GenMolHashString,
|
|
(python::arg("mol"), python::arg("atomsToUse") = python::list(),
|
|
python::arg("bondsToUse") = python::list()),
|
|
docString.c_str());
|
|
python::def("MolHash", MolHashHelper,
|
|
(python::arg("mol"), python::arg("func")),
|
|
"Generate a hash for a molecule. The func argument determines "
|
|
"which hash is generated.");
|
|
}
|