Files
rdkit/External/pubchem_shape/Wrap/cshapealign.cpp
David Cosgrove 21b3c4e6f1 Shape overlay initial start aligned to principal axes (#8999)
* Add MolTransforms library.

* Transform to inertial frame of reference before overlay.

* Vital fix of typo in comment.

* Tidy up debugging cruft.

* Comment in CMakeLists.txt.

* Fix python wrappers.

* Extra tidy.

* Response to review.

* Tidy includes.

---------

Co-authored-by: David Cosgrove <david@cozchemix.co.uk>
2025-12-20 08:35:28 +01:00

527 lines
19 KiB
C++

/*******************************************************************************
Copyright 2024 by Greg Landrum and the pubchem_shape contributors
This file is part of pubchem_shape
Permission is hereby granted, free of charge, to any person obtaining a copy of
this software and associated documentation files (the "Software"), to deal in
the Software without restriction, including without limitation the rights to
use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies of
the Software, and to permit persons to whom the Software is furnished to do so,
subject to the following conditions:
The above copyright notice and this permission notice shall be included in all
copies or substantial portions of the Software.
THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS
FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR
COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER
IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
***********************************************************************/
#include <boost/python.hpp>
#include <vector>
#include "../PubChemShape.hpp"
#include <GraphMol/RDKitBase.h>
#include <RDBoost/Wrap.h>
namespace python = boost::python;
namespace helpers {
python::tuple alignMol(const RDKit::ROMol &ref, RDKit::ROMol &probe,
int refConfId, int probeConfId, bool useColors,
double opt_param, unsigned int max_preiters,
unsigned int max_postiters) {
std::vector<float> matrix(12, 0.0);
auto [nbr_st, nbr_ct] =
AlignMolecule(ref, probe, matrix, refConfId, probeConfId, useColors,
opt_param, max_preiters, max_postiters);
return python::make_tuple(nbr_st, nbr_ct);
}
python::tuple alignMol3(const RDKit::ROMol &ref, RDKit::ROMol &probe,
const ShapeInputOptions &refShapeOpts,
const ShapeInputOptions &probeShapeOpts, int refConfId,
int probeConfId, double opt_param,
unsigned int max_preiters, unsigned int max_postiters) {
std::vector<float> matrix(12, 0.0);
auto [nbr_st, nbr_ct] =
AlignMolecule(ref, probe, matrix, refShapeOpts, probeShapeOpts, refConfId,
probeConfId, opt_param, max_preiters, max_postiters);
return python::make_tuple(nbr_st, nbr_ct);
}
python::tuple alignMol2(const ShapeInput &ref, RDKit::ROMol &probe,
int probeConfId, bool useColors, double opt_param,
unsigned int max_preiters, unsigned int max_postiters,
bool applyRefShift) {
std::vector<float> matrix(12, 0.0);
auto [nbr_st, nbr_ct] =
AlignMolecule(ref, probe, matrix, probeConfId, useColors, opt_param,
max_preiters, max_postiters, applyRefShift);
return python::make_tuple(nbr_st, nbr_ct);
}
python::tuple alignShapes(const ShapeInput &refShape, ShapeInput &fitShape,
double opt_param, unsigned int max_preiters,
unsigned int max_postiters) {
std::vector<float> matrix(12, 0.0);
auto [nbr_st, nbr_ct] = AlignShape(refShape, fitShape, matrix, opt_param,
max_preiters, max_postiters);
python::list pyMatrix;
for (auto m : matrix) {
pyMatrix.append(m);
}
return python::make_tuple(nbr_st, nbr_ct, pyMatrix);
}
python::tuple scoreMolecule1(const RDKit::ROMol &mol1, RDKit::ROMol &mol2,
const ShapeInputOptions &mol1ShapeOpts,
const ShapeInputOptions &mol2ShapeOpts,
int mol1ConfId, int mol2ConfId) {
auto [nbr_st, nbr_ct] = ScoreMolecule(mol1, mol2, mol1ShapeOpts,
mol2ShapeOpts, mol1ConfId, mol2ConfId);
return python::make_tuple(nbr_st, nbr_ct);
}
python::tuple scoreMolecule2(const ShapeInput &shape, RDKit::ROMol &mol,
const ShapeInputOptions &molShapeOpts,
int molConfId) {
auto [nbr_st, nbr_ct] = ScoreMolecule(shape, mol, molShapeOpts, molConfId);
return python::make_tuple(nbr_st, nbr_ct);
}
python::tuple scoreShape(const ShapeInput &shape1, ShapeInput &shape2,
bool useColors) {
auto [nbr_st, nbr_ct] = ScoreShape(shape1, shape2, useColors);
return python::make_tuple(nbr_st, nbr_ct);
}
void transformConformer(const python::list &pyFinalTrans,
const python::list &pyFinalRot,
const python::list &pyMatrix, ShapeInput probeShape,
RDKit::Conformer &probeConf) {
std::vector<float> matrix;
pythonObjectToVect<float>(pyMatrix, matrix);
if (matrix.size() != 12) {
throw_value_error(
"The transformation matrix must have 12 values. It had " +
std::to_string(matrix.size()) + ".");
}
std::vector<double> finalTrans;
pythonObjectToVect<double>(pyFinalTrans, finalTrans);
if (finalTrans.size() != 3) {
throw_value_error(
"The final translation vector must have 3 values. It had " +
std::to_string(finalTrans.size()) + ".");
}
std::vector<double> finalRot;
pythonObjectToVect<double>(pyFinalRot, finalRot);
if (finalRot.size() != 9) {
throw_value_error("The final rotation vector must have 9 values. It had " +
std::to_string(finalRot.size()) + ".");
}
TransformConformer(finalTrans, finalRot, matrix, probeShape, probeConf);
}
ShapeInput *prepConf(const RDKit::ROMol &mol, int confId,
const python::object &py_opts) {
ShapeInputOptions opts;
if (!py_opts.is_none()) {
opts = python::extract<ShapeInputOptions>(py_opts);
}
return new ShapeInput(PrepareConformer(mol, confId, opts));
}
void set_atomSubset(ShapeInputOptions &opts, const python::object &as) {
pythonObjectToVect<unsigned int>(as, opts.atomSubset);
}
python::tuple get_atomSubset(const ShapeInputOptions &opts) {
python::list py_list;
for (const auto &val : opts.atomSubset) {
py_list.append(val);
}
return python::tuple(py_list);
}
void set_notColorAtoms(ShapeInputOptions &opts, const python::object &nca) {
pythonObjectToVect<unsigned int>(nca, opts.notColorAtoms);
}
python::tuple get_notColorAtoms(const ShapeInputOptions &opts) {
python::list py_list;
for (const auto &val : opts.notColorAtoms) {
py_list.append(val);
}
return python::tuple(py_list);
}
void set_atomRadii(ShapeInputOptions &opts, const python::object &ar) {
int len = python::len(ar);
opts.atomRadii.resize(len);
for (int i = 0; i < len; i++) {
unsigned int atomIdx = python::extract<unsigned int>(ar[i][0]);
double radius = python::extract<double>(ar[i][1]);
opts.atomRadii[i] = std::make_pair(atomIdx, radius);
}
}
python::tuple get_atomRadii(const ShapeInputOptions &opts) {
python::list py_list;
for (const auto &val : opts.atomRadii) {
py_list.append(python::make_tuple(static_cast<int>(val.first), val.second));
}
return python::tuple(py_list);
}
void set_shapeShift(ShapeInput &shp, const python::object &s) {
pythonObjectToVect<double>(s, shp.shift);
}
python::list get_shapeShift(const ShapeInput &shp) {
python::list py_list;
for (const auto &val : shp.shift) {
py_list.append(val);
}
return py_list;
}
python::list get_inertialRot(const ShapeInput &shp) {
python::list py_list;
for (const auto &val : shp.inertialRot) {
py_list.append(val);
}
return py_list;
}
void set_customFeatures(ShapeInputOptions &shp, const python::object &s) {
shp.customFeatures.clear();
auto len = python::len(s);
shp.customFeatures.reserve(len);
for (auto i = 0u; i < len; ++i) {
const auto elem = s[i];
unsigned int featType = python::extract<unsigned int>(elem[0]);
RDGeom::Point3D pos = python::extract<RDGeom::Point3D>(elem[1]);
double radius = python::extract<double>(elem[2]);
shp.customFeatures.emplace_back(featType, pos, radius);
}
}
python::tuple get_customFeatures(const ShapeInputOptions &shp) {
python::list py_list;
for (const auto &val : shp.customFeatures) {
python::list elem;
elem.append(static_cast<int>(std::get<0>(val)));
elem.append(std::get<1>(val));
elem.append(std::get<2>(val));
py_list.append(python::tuple(elem));
}
return python::tuple(py_list);
}
} // namespace helpers
void wrap_pubchemshape() {
RegisterVectorConverter<float>("FloatVector");
RegisterVectorConverter<double>("DoubleVector");
RegisterVectorConverter<unsigned int>("UnsignedIntVector");
python::class_<ShapeInputOptions, boost::noncopyable>("ShapeInputOptions",
"Shape Input Options")
.def_readwrite(
"useColors", &ShapeInputOptions::useColors,
"Whether to use colors (pharmacophore features) in the score. Default=True.")
.def_readwrite(
"includeDummies", &ShapeInputOptions::includeDummies,
"Whether to use dummy atoms in the alignment. Default=False.")
.def_readwrite(
"dummyRadius", &ShapeInputOptions::dummyRadius,
"If using dummy atoms in the alignment, what radius to use for them."
" Default=2.16 (the radius of Xe).")
.add_property(
"atomSubset", &helpers::get_atomSubset, &helpers::set_atomSubset,
"If not empty, use just these atoms in the molecule to form the ShapeInput object.")
.add_property(
"notColorAtoms", &helpers::get_notColorAtoms,
&helpers::set_notColorAtoms,
"Any atoms mentioned here by index should not be used in a color feature.")
.add_property(
"atomRadii", &helpers::get_atomRadii, &helpers::set_atomRadii,
"Non-standard radii to use for the atoms specified by their indices"
" in the molecule. A list of tuples of [int, float].")
.add_property("customFeatures", &helpers::get_customFeatures,
&helpers::set_customFeatures,
"Custom features for the shape.")
.def_readwrite("normalize", &ShapeInputOptions::normalize,
"Whether to normalise the shape by putting into"
"its inertial frame. Default=True.")
.def("__setattr__", &safeSetattr);
python::def(
"AlignMol", &helpers::alignMol,
(python::arg("ref"), python::arg("probe"), python::arg("refConfId") = -1,
python::arg("probeConfId") = -1, python::arg("useColors") = true,
python::arg("opt_param") = 1.0, python::arg("max_preiters") = 10,
python::arg("max_postiters") = 30),
R"DOC(Aligns a probe molecule to a reference molecule. The probe is modified.
Parameters
----------
ref : RDKit.ROMol
Reference molecule
probe : RDKit.ROMol
Probe molecule
refConfId : int, optional
Reference conformer ID (default is -1)
probeConfId : int, optional
Probe conformer ID (default is -1)
useColors : bool, optional
Whether or not to use colors in the scoring (default is True)
opt_param : float, optional
Balance of shape and color for optimization.
0 is only color, 0.5 is equal weight, and 1.0 is only shape.
Default is 1.0.
max_preiters : int, optional
In the two phase optimization, the maximum iterations done on all poses.
max_postiters : int, optional
In the two phase optimization, the maximum iterations during the second phase on
only the best poses from the first phase
Returns
-------
2-tuple of doubles
The results are (shape_score, color_score)
The color_score is zero if opt_param is 1.0.)DOC");
python::def(
"AlignMol", &helpers::alignMol3,
(python::arg("ref"), python::arg("probe"), python::arg("refShapeOpts"),
python::arg("probeShapeOpts"), python::arg("refConfId") = -1,
python::arg("probeConfId") = -1, python::arg("opt_param") = 1.0,
python::arg("max_preiters") = 10, python::arg("max_postiters") = 30),
R"DOC(Aligns a probe molecule to a reference molecule. The probe is modified.
Parameters
----------
ref : RDKit.ROMol
Reference molecule
probe : RDKit.ROMol
Probe molecule
refShapeOpts : ShapeInputOptions
Options for constructing the shape for the reference molecule
probeShapeOpts : ShapeInputOptions
Options for constructing the shape for the probe molecule
refConfId : int, optional
Reference conformer ID (default is -1)
probeConfId : int, optional
Probe conformer ID (default is -1)
opt_param : float, optional
Balance of shape and color for optimization.
0 is only color, 0.5 is equal weight, and 1.0 is only shape.
Default is 1.0.
max_preiters : int, optional
In the two phase optimization, the maximum iterations done on all poses.
max_postiters : int, optional
In the two phase optimization, the maximum iterations during the second phase on
only the best poses from the first phase
Returns
-------
2-tuple of doubles
The results are (shape_score, color_score)
The color_score is zero if opt_param is 1.0.)DOC");
python::def(
"AlignMol", &helpers::alignMol2,
(python::arg("refShape"), python::arg("probe"),
python::arg("probeConfId") = -1, python::arg("useColors") = true,
python::arg("opt_param") = 1.0, python::arg("max_preiters") = 10,
python::arg("max_postiters") = 30, python::arg("applyRefShift") = false),
R"DOC(Aligns a probe molecule to a reference shape. The probe is modified.
Assumes the shapes are both centred on the origin.
Parameters
----------
refShape : ShapeInput
Reference shape
probe : RDKit.ROMol
Probe molecule
probeConfId : int, optional
Probe conformer ID (default is -1)
useColors : bool, optional
Whether or not to use colors in the scoring (default is True)
opt_param : float, optional
Balance of shape and color for optimization.
0 is only color, 0.5 is equal weight, and 1.0 is only shape.
Default is 1.0.
max_preiters : int, optional
In the two phase optimization, the maximum iterations done on all poses.
max_postiters : int, optional
In the two phase optimization, the maximum iterations during the second phase on
only the best poses from the first phase
applyRefShift : bool, optional
If True, apply the reference shape's shift translation to the final
coordinates.
Returns
-------
2-tuple of doubles
The results are (shape_score, color_score)
The color_score is zero if opt_param is 1.0.)DOC");
python::def(
"AlignShapes", &helpers::alignShapes,
(python::arg("refShape"), python::arg("probeShape"),
python::arg("opt_param") = 1.0, python::arg("max_preiters") = 10,
python::arg("max_postiters") = 30),
R"DOC(Aligns a probe shape to a reference shape. The probe is modified.
Parameters
----------
refShape : ShapeInput
Reference shape
probeShape : ShapeInput
Probe shape
opt_param : float, optional
Balance of shape and color for optimization.
0 is only color, 0.5 is equal weight, and 1.0 is only shape
max_preiters : int, optional
In the two phase optimization, the maximum iterations done on all poses.
max_postiters : int, optional
In the two phase optimization, the maximum iterations during the second phase on
only the best poses from the first phase
Returns
-------
3-tuple of double, double, list of doubles
The results are (shape_score, color_score, matrix)
The matrix is a 12-float list giving the transformation matrix that
overlays the probe onto the reference.)DOC");
python::def(
"TransformConformer", &helpers::transformConformer,
(python::arg("finalTrans"), python::arg("matrix"),
python::arg("probeShape"), python::arg("probeConformer")),
R"DOC(Assuming that probeShape has been overlaid onto refShape to give
the supplied transformation matrix, applies that transformation to the
given conformer.
Parameters
----------
finalTrans : list[float * 3]
The final translation to apply to conformer.
matrix: list[float * 12]
The transformation matrix
probeShape : ShapeInput
Probe shape
probeConformer : Conformer
Probe conformer
)DOC");
python::def("PrepareConformer", &helpers::prepConf,
(python::arg("mol"), python::arg("confId") = -1,
python::arg("opts") = python::object()),
R"DOC(Generates a ShapeInput object for a molecule
Parameters
----------
mol : RDKit.ROMol
Reference molecule
confId : int, optional
Conformer ID to use (default is -1)
opts : ShapeInputOptions, optional
Options for Shapeinput
Returns
-------
a ShapeInput for the molecule)DOC",
python::return_value_policy<python::manage_new_object>());
python::class_<ShapeInput, boost::noncopyable>("ShapeInput", python::no_init)
.def_readwrite("coord", &ShapeInput::coord)
.def_readwrite("alpha_vector", &ShapeInput::alpha_vector)
.def_readwrite("atom_type_vector", &ShapeInput::atom_type_vector)
.def_readwrite("volumeAtomIndexVector",
&ShapeInput::volumeAtomIndexVector)
.add_property("shift", &helpers::get_shapeShift, &helpers::set_shapeShift,
"Translation of centre of shape coordinates to origin.")
.add_property(
"inertialRot", &helpers::get_inertialRot,
"Rotation applied to put the shape into its principal axes frame of reference.")
.def_readwrite("sov", &ShapeInput::sov)
.def_readwrite("sof", &ShapeInput::sof);
python::def(
"ScoreMol", &helpers::scoreMolecule1,
(python::arg("mol1"), python::arg("mol2"), python::arg("mol1ShapeOpts"),
python::arg("mol2ShapeOpts"), python::arg("mol1ConfId") = -1,
python::arg("mol2ConfId") = -1),
R"DOC(Calculate the scores between a shape and a molecule without moving them.
Parameters
----------
mol1 : RDKit.ROMol
First molecule
mol2 : RDKit.ROMol
Second molecule
mol1ShapeOptions:
Options for constructing the shape for molecule 1
mol2ShapeOptions:
Options for constructing the shape for molecule 2
mol1ConfId : int, optional
First molecule conformer ID (default is -1)
mol2ConfId : int, optional
Second conformer ID (default is -1)
Returns
-------
2-tuple of doubles
The results are (shape_score, color_score)
The color_score is zero if useColors is False for either of the
shape options)DOC");
python::def(
"ScoreMol", &helpers::scoreMolecule2,
(python::arg("shape"), python::arg("mol"), python::arg("molShapeOpts"),
python::arg("molConfId") = -1),
R"DOC(Calculate the scores between 2 molecules without moving them.
Parameters
----------
shape : ShapeInput
Shape
mol : RDKit.ROMol
Molecule
molShapeOptions:
Options for constructing the shape for molecule
molConfId : int, optional
Molecule conformer ID (default is -1)
Returns
-------
2-tuple of doubles
The results are (shape_score, color_score)
The color_score is zero if shape.useColors is False)DOC");
python::def("ScoreShape", &helpers::scoreShape,
(python::arg("shape1"), python::arg("shape2"),
python::arg("useColors") = false),
R"DOC(Calculate the scores between 2 shapes without moving them.
Parameters
----------
shape1 : ShapeInput
Shape
shape2 : ShapeInput
Shape
useColors : bool
Whether to use colors for the score or not.
Returns
-------
2-tuple of doubles
The results are (shape_score, color_score)
The color_score is zero if useColors is False)DOC");
}
BOOST_PYTHON_MODULE(rdShapeAlign) { wrap_pubchemshape(); }