mirror of
https://github.com/rdkit/rdkit.git
synced 2026-06-04 21:54:27 +08:00
809 lines
28 KiB
C++
809 lines
28 KiB
C++
//
|
|
// Copyright (C) 2001-2018 Rational Discovery LLC
|
|
//
|
|
// @@ All Rights Reserved @@
|
|
// This file is part of the RDKit.
|
|
// The contents are covered by the terms of the BSD license
|
|
// which is included in the file license.txt, found at the root
|
|
// of the RDKit source tree.
|
|
//
|
|
#include <RDGeneral/test.h>
|
|
#include "AlignMolecules.h"
|
|
#include "O3AAlignMolecules.h"
|
|
#include <GraphMol/FileParsers/MolSupplier.h>
|
|
#include <GraphMol/FileParsers/MolWriters.h>
|
|
#include <GraphMol/FileParsers/FileParsers.h>
|
|
#include <GraphMol/Descriptors/Crippen.h>
|
|
#include <GraphMol/ROMol.h>
|
|
#include <GraphMol/Conformer.h>
|
|
#include <GraphMol/Substruct/SubstructMatch.h>
|
|
#include <Numerics/Vector.h>
|
|
#include <ForceField/ForceField.h>
|
|
#include <GraphMol/ForceFieldHelpers/UFF/Builder.h>
|
|
#include <GraphMol/ForceFieldHelpers/MMFF/Builder.h>
|
|
#include <GraphMol/MolPickler.h>
|
|
#include <GraphMol/DistGeomHelpers/Embedder.h>
|
|
#include <GraphMol/SmilesParse/SmilesParse.h>
|
|
#include <GraphMol/MolTransforms/MolTransforms.h>
|
|
|
|
using namespace RDKit;
|
|
|
|
void testMMFFO3A() {
|
|
std::string rdbase = getenv("RDBASE");
|
|
std::string sdf = rdbase + "/Code/GraphMol/MolAlign/test_data/ref_e2";
|
|
std::string newSdf = sdf + "_MMFFO3A.sdf";
|
|
sdf += ".sdf";
|
|
SDMolSupplier supplier(sdf, true, false);
|
|
int nMol = supplier.length();
|
|
const int refNum = 48;
|
|
// SDWriter *newMol = new SDWriter(newSdf);
|
|
ROMol *refMol = supplier[refNum];
|
|
MMFF::MMFFMolProperties refMP(*refMol);
|
|
double cumScore = 0.0;
|
|
double cumMsd = 0.0;
|
|
for (int prbNum = 0; prbNum < nMol; ++prbNum) {
|
|
ROMol *prbMol = supplier[prbNum];
|
|
MMFF::MMFFMolProperties prbMP(*prbMol);
|
|
MolAlign::O3A o3a(*prbMol, *refMol, &prbMP, &refMP);
|
|
double rmsd = o3a.align();
|
|
cumScore += o3a.score();
|
|
cumMsd += rmsd * rmsd;
|
|
// newMol->write(prbMol);
|
|
delete prbMol;
|
|
}
|
|
cumMsd /= (double)nMol;
|
|
delete refMol;
|
|
// newMol->close();
|
|
// std::cerr<<cumScore<<","<<sqrt(cumMsd)<<std::endl;
|
|
TEST_ASSERT(RDKit::feq(cumScore, 6941.8, 1));
|
|
TEST_ASSERT(RDKit::feq(sqrt(cumMsd), .345, .001));
|
|
}
|
|
|
|
void testCrippenO3A() {
|
|
std::string rdbase = getenv("RDBASE");
|
|
std::string sdf = rdbase + "/Code/GraphMol/MolAlign/test_data/ref_e2";
|
|
std::string newSdf = sdf + "_CrippenO3A.sdf";
|
|
sdf += ".sdf";
|
|
SDMolSupplier supplier(sdf, true, false);
|
|
int nMol = supplier.length();
|
|
const int refNum = 48;
|
|
// SDWriter *newMol = new SDWriter(newSdf);
|
|
ROMol *refMol = supplier[refNum];
|
|
unsigned int refNAtoms = refMol->getNumAtoms();
|
|
std::vector<double> refLogpContribs(refNAtoms);
|
|
std::vector<double> refMRContribs(refNAtoms);
|
|
std::vector<unsigned int> refAtomTypes(refNAtoms);
|
|
std::vector<std::string> refAtomTypeLabels(refNAtoms);
|
|
Descriptors::getCrippenAtomContribs(*refMol, refLogpContribs, refMRContribs,
|
|
true, &refAtomTypes, &refAtomTypeLabels);
|
|
double cumScore = 0.0;
|
|
double cumMsd = 0.0;
|
|
for (int prbNum = 0; prbNum < nMol; ++prbNum) {
|
|
ROMol *prbMol = supplier[prbNum];
|
|
unsigned int prbNAtoms = prbMol->getNumAtoms();
|
|
std::vector<double> prbLogpContribs(prbNAtoms);
|
|
std::vector<double> prbMRContribs(prbNAtoms);
|
|
std::vector<unsigned int> prbAtomTypes(prbNAtoms);
|
|
std::vector<std::string> prbAtomTypeLabels(prbNAtoms);
|
|
Descriptors::getCrippenAtomContribs(*prbMol, prbLogpContribs, prbMRContribs,
|
|
true, &prbAtomTypes,
|
|
&prbAtomTypeLabels);
|
|
MolAlign::O3A o3a(*prbMol, *refMol, &prbLogpContribs, &refLogpContribs,
|
|
MolAlign::O3A::CRIPPEN);
|
|
double rmsd = o3a.align();
|
|
cumScore += o3a.score();
|
|
cumMsd += rmsd * rmsd;
|
|
// newMol->write(prbMol);
|
|
delete prbMol;
|
|
}
|
|
cumMsd /= (double)nMol;
|
|
delete refMol;
|
|
// newMol->close();
|
|
// std::cerr<<cumScore<<","<<sqrt(cumMsd)<<std::endl;
|
|
TEST_ASSERT(RDKit::feq(cumScore, 4918.1, 1));
|
|
TEST_ASSERT(RDKit::feq(sqrt(cumMsd), .304, .001));
|
|
}
|
|
|
|
void testMMFFO3AMolHist() {
|
|
std::string rdbase = getenv("RDBASE");
|
|
std::string sdf = rdbase + "/Code/GraphMol/MolAlign/test_data/ref_e2";
|
|
std::string newSdf = sdf + "_MMFFO3A.sdf";
|
|
sdf += ".sdf";
|
|
SDMolSupplier supplier(sdf, true, false);
|
|
int nMol = supplier.length();
|
|
const int refNum = 48;
|
|
// SDWriter *newMol = new SDWriter(newSdf);
|
|
ROMol *refMol = supplier[refNum];
|
|
MMFF::MMFFMolProperties refMP(*refMol);
|
|
double *refDmat = MolOps::get3DDistanceMat(*refMol);
|
|
MolAlign::MolHistogram refHist(*refMol, refDmat);
|
|
double cumScore = 0.0;
|
|
double cumMsd = 0.0;
|
|
for (int prbNum = 0; prbNum < nMol; ++prbNum) {
|
|
ROMol *prbMol = supplier[prbNum];
|
|
MMFF::MMFFMolProperties prbMP(*prbMol);
|
|
double *prbDmat = MolOps::get3DDistanceMat(*prbMol);
|
|
MolAlign::MolHistogram prbHist(*prbMol, prbDmat);
|
|
|
|
MolAlign::O3A o3a(*prbMol, *refMol, &prbMP, &refMP, MolAlign::O3A::MMFF94,
|
|
-1, -1, false, 50, 0, nullptr, nullptr, nullptr, &prbHist,
|
|
&refHist);
|
|
double rmsd = o3a.align();
|
|
cumScore += o3a.score();
|
|
cumMsd += rmsd * rmsd;
|
|
// newMol->write(prbMol);
|
|
delete prbMol;
|
|
}
|
|
cumMsd /= (double)nMol;
|
|
delete refMol;
|
|
// newMol->close();
|
|
// std::cerr<<cumScore<<","<<sqrt(cumMsd)<<std::endl;
|
|
TEST_ASSERT(RDKit::feq(cumScore, 6941.8, 1));
|
|
TEST_ASSERT(RDKit::feq(sqrt(cumMsd), .345, .001));
|
|
}
|
|
|
|
void testCrippenO3AMolHist() {
|
|
std::string rdbase = getenv("RDBASE");
|
|
std::string sdf = rdbase + "/Code/GraphMol/MolAlign/test_data/ref_e2";
|
|
std::string newSdf = sdf + "_CrippenO3A.sdf";
|
|
sdf += ".sdf";
|
|
SDMolSupplier supplier(sdf, true, false);
|
|
int nMol = supplier.length();
|
|
const int refNum = 48;
|
|
// SDWriter *newMol = new SDWriter(newSdf);
|
|
ROMol *refMol = supplier[refNum];
|
|
unsigned int refNAtoms = refMol->getNumAtoms();
|
|
std::vector<double> refLogpContribs(refNAtoms);
|
|
std::vector<double> refMRContribs(refNAtoms);
|
|
std::vector<unsigned int> refAtomTypes(refNAtoms);
|
|
std::vector<std::string> refAtomTypeLabels(refNAtoms);
|
|
Descriptors::getCrippenAtomContribs(*refMol, refLogpContribs, refMRContribs,
|
|
true, &refAtomTypes, &refAtomTypeLabels);
|
|
double *refDmat = MolOps::get3DDistanceMat(*refMol);
|
|
MolAlign::MolHistogram refHist(*refMol, refDmat);
|
|
double cumScore = 0.0;
|
|
double cumMsd = 0.0;
|
|
for (int prbNum = 0; prbNum < nMol; ++prbNum) {
|
|
ROMol *prbMol = supplier[prbNum];
|
|
unsigned int prbNAtoms = prbMol->getNumAtoms();
|
|
std::vector<double> prbLogpContribs(prbNAtoms);
|
|
std::vector<double> prbMRContribs(prbNAtoms);
|
|
std::vector<unsigned int> prbAtomTypes(prbNAtoms);
|
|
std::vector<std::string> prbAtomTypeLabels(prbNAtoms);
|
|
Descriptors::getCrippenAtomContribs(*prbMol, prbLogpContribs, prbMRContribs,
|
|
true, &prbAtomTypes,
|
|
&prbAtomTypeLabels);
|
|
double *prbDmat = MolOps::get3DDistanceMat(*prbMol);
|
|
MolAlign::MolHistogram prbHist(*prbMol, prbDmat);
|
|
|
|
MolAlign::O3A o3a(*prbMol, *refMol, &prbLogpContribs, &refLogpContribs,
|
|
MolAlign::O3A::CRIPPEN, -1, -1, false, 50, 0, nullptr,
|
|
nullptr, nullptr, &prbHist, &refHist);
|
|
double rmsd = o3a.align();
|
|
cumScore += o3a.score();
|
|
cumMsd += rmsd * rmsd;
|
|
// newMol->write(prbMol);
|
|
delete prbMol;
|
|
}
|
|
cumMsd /= (double)nMol;
|
|
delete refMol;
|
|
// newMol->close();
|
|
// std::cerr<<cumScore<<","<<sqrt(cumMsd)<<std::endl;
|
|
TEST_ASSERT(RDKit::feq(cumScore, 4918.1, 1));
|
|
TEST_ASSERT(RDKit::feq(sqrt(cumMsd), .304, .001));
|
|
}
|
|
|
|
void testMMFFO3AConstraints() {
|
|
ROMol *m = SmilesToMol("n1ccc(cc1)-c1ccccc1");
|
|
TEST_ASSERT(m);
|
|
ROMol *m1 = MolOps::addHs(*m);
|
|
delete m;
|
|
TEST_ASSERT(m1);
|
|
DGeomHelpers::EmbedMolecule(*m1);
|
|
MMFF::sanitizeMMFFMol((RWMol &)(*m1));
|
|
MMFF::MMFFMolProperties mp(*m1);
|
|
TEST_ASSERT(mp.isValid());
|
|
ForceFields::ForceField *field = MMFF::constructForceField(*m1, &mp);
|
|
field->initialize();
|
|
field->minimize();
|
|
delete field;
|
|
|
|
RWMol *patt = SmartsToMol("nccc-cccc");
|
|
MatchVectType matchVect;
|
|
TEST_ASSERT(SubstructMatch(*m1, (ROMol &)*patt, matchVect));
|
|
delete patt;
|
|
unsigned int nIdx = matchVect[0].second;
|
|
unsigned int cIdx = matchVect[matchVect.size() - 1].second;
|
|
MolTransforms::setDihedralDeg(m1->getConformer(), matchVect[2].second,
|
|
matchVect[3].second, matchVect[4].second,
|
|
matchVect[5].second, 0.0);
|
|
ROMol m2(*m1);
|
|
MolAlign::randomTransform(m2);
|
|
ROMol m3(m2);
|
|
auto *o3a = new MolAlign::O3A(m2, *m1, &mp, &mp);
|
|
TEST_ASSERT(o3a);
|
|
o3a->align();
|
|
delete o3a;
|
|
double d =
|
|
(m2.getConformer().getAtomPos(cIdx) - m1->getConformer().getAtomPos(cIdx))
|
|
.length();
|
|
TEST_ASSERT(feq(d, 0.0, 1));
|
|
MatchVectType constraintMap;
|
|
constraintMap.push_back(std::make_pair(cIdx, nIdx));
|
|
o3a = new MolAlign::O3A(m3, *m1, &mp, &mp, MolAlign::O3A::MMFF94, -1, -1,
|
|
false, 50, 0, &constraintMap);
|
|
TEST_ASSERT(o3a);
|
|
o3a->align();
|
|
delete o3a;
|
|
d = (m3.getConformer().getAtomPos(cIdx) - m1->getConformer().getAtomPos(cIdx))
|
|
.length();
|
|
TEST_ASSERT(feq(d, 7.0, 1.0));
|
|
delete m1;
|
|
}
|
|
|
|
void testCrippenO3AConstraints() {
|
|
ROMol *m = SmilesToMol("n1ccc(cc1)-c1ccccc1");
|
|
TEST_ASSERT(m);
|
|
ROMol *m1 = MolOps::addHs(*m);
|
|
delete m;
|
|
TEST_ASSERT(m1);
|
|
DGeomHelpers::EmbedMolecule(*m1);
|
|
MMFF::sanitizeMMFFMol((RWMol &)(*m1));
|
|
MMFF::MMFFMolProperties mp(*m1);
|
|
TEST_ASSERT(mp.isValid());
|
|
ForceFields::ForceField *field = MMFF::constructForceField(*m1, &mp);
|
|
field->initialize();
|
|
field->minimize();
|
|
delete field;
|
|
RWMol *patt = SmartsToMol("nccc-cccc");
|
|
MatchVectType matchVect;
|
|
TEST_ASSERT(SubstructMatch(*m1, (ROMol &)*patt, matchVect));
|
|
delete patt;
|
|
unsigned int nIdx = matchVect[0].second;
|
|
unsigned int cIdx = matchVect[matchVect.size() - 1].second;
|
|
MolTransforms::setDihedralDeg(m1->getConformer(), matchVect[2].second,
|
|
matchVect[3].second, matchVect[4].second,
|
|
matchVect[5].second, 0.0);
|
|
ROMol m2(*m1);
|
|
MolAlign::randomTransform(m2);
|
|
ROMol m3(m2);
|
|
unsigned int prbNAtoms = m2.getNumAtoms();
|
|
std::vector<double> prbLogpContribs(prbNAtoms);
|
|
std::vector<double> prbMRContribs(prbNAtoms);
|
|
std::vector<unsigned int> prbAtomTypes(prbNAtoms);
|
|
std::vector<std::string> prbAtomTypeLabels(prbNAtoms);
|
|
Descriptors::getCrippenAtomContribs(m2, prbLogpContribs, prbMRContribs, true,
|
|
&prbAtomTypes, &prbAtomTypeLabels);
|
|
auto *o3a = new MolAlign::O3A(m2, *m1, &prbLogpContribs, &prbLogpContribs,
|
|
MolAlign::O3A::CRIPPEN);
|
|
TEST_ASSERT(o3a);
|
|
o3a->align();
|
|
delete o3a;
|
|
double d =
|
|
(m2.getConformer().getAtomPos(cIdx) - m1->getConformer().getAtomPos(cIdx))
|
|
.length();
|
|
TEST_ASSERT(feq(d, 0.0, 1));
|
|
MatchVectType constraintMap;
|
|
constraintMap.push_back(std::make_pair(cIdx, nIdx));
|
|
o3a = new MolAlign::O3A(m3, *m1, &prbLogpContribs, &prbLogpContribs,
|
|
MolAlign::O3A::CRIPPEN, -1, -1, false, 50, 0,
|
|
&constraintMap);
|
|
TEST_ASSERT(o3a);
|
|
o3a->align();
|
|
delete o3a;
|
|
d = (m3.getConformer().getAtomPos(cIdx) - m1->getConformer().getAtomPos(cIdx))
|
|
.length();
|
|
TEST_ASSERT(feq(d, 7.0, 1.0));
|
|
delete m1;
|
|
}
|
|
|
|
void testMMFFO3AConstraintsAndLocalOnly() {
|
|
std::string rdbase = getenv("RDBASE");
|
|
std::string sdf = rdbase + "/Code/GraphMol/MolAlign/test_data/ref_e2.sdf";
|
|
SDMolSupplier supplier(sdf, true, false);
|
|
const int refNum = 23;
|
|
const int prbNum = 32;
|
|
ROMol *refMol = supplier[refNum];
|
|
ROMol *prbMol = supplier[prbNum];
|
|
unsigned int refNAtoms = refMol->getNumAtoms();
|
|
std::vector<double> refLogpContribs(refNAtoms);
|
|
std::vector<double> refMRContribs(refNAtoms);
|
|
std::vector<unsigned int> refAtomTypes(refNAtoms);
|
|
std::vector<std::string> refAtomTypeLabels(refNAtoms);
|
|
Descriptors::getCrippenAtomContribs(*refMol, refLogpContribs, refMRContribs,
|
|
true, &refAtomTypes, &refAtomTypeLabels);
|
|
unsigned int prbNAtoms = prbMol->getNumAtoms();
|
|
std::vector<double> prbLogpContribs(prbNAtoms);
|
|
std::vector<double> prbMRContribs(prbNAtoms);
|
|
std::vector<unsigned int> prbAtomTypes(prbNAtoms);
|
|
std::vector<std::string> prbAtomTypeLabels(prbNAtoms);
|
|
Descriptors::getCrippenAtomContribs(*prbMol, prbLogpContribs, prbMRContribs,
|
|
true, &prbAtomTypes, &prbAtomTypeLabels);
|
|
RWMol *patt = SmartsToMol("S");
|
|
MatchVectType matchVect;
|
|
TEST_ASSERT(SubstructMatch(*refMol, (ROMol &)*patt, matchVect));
|
|
delete patt;
|
|
unsigned int refSIdx = matchVect[0].second;
|
|
matchVect.clear();
|
|
patt = SmartsToMol("O");
|
|
TEST_ASSERT(SubstructMatch(*prbMol, (ROMol &)*patt, matchVect));
|
|
delete patt;
|
|
unsigned int prbOIdx = matchVect[0].second;
|
|
std::vector<double> distOS(2);
|
|
distOS[0] = 2.7;
|
|
distOS[1] = 0.4;
|
|
std::vector<double> weights(2);
|
|
weights[0] = 0.1;
|
|
weights[1] = 100.0;
|
|
for (unsigned int i = 0; i < 2; ++i) {
|
|
MatchVectType constraintMap;
|
|
constraintMap.push_back(std::make_pair(prbOIdx, refSIdx));
|
|
RDNumeric::DoubleVector constraintWeights(1);
|
|
constraintWeights[0] = weights[i];
|
|
auto *o3a =
|
|
new MolAlign::O3A(*prbMol, *refMol, &prbLogpContribs, &refLogpContribs,
|
|
MolAlign::O3A::CRIPPEN, -1, -1, false, 50, 0,
|
|
&constraintMap, &constraintWeights);
|
|
TEST_ASSERT(o3a);
|
|
o3a->align();
|
|
delete o3a;
|
|
o3a = new MolAlign::O3A(*prbMol, *refMol, &prbLogpContribs,
|
|
&refLogpContribs, MolAlign::O3A::CRIPPEN, -1, -1,
|
|
false, 50, MolAlign::O3_LOCAL_ONLY);
|
|
TEST_ASSERT(o3a);
|
|
o3a->align();
|
|
delete o3a;
|
|
double d = (prbMol->getConformer().getAtomPos(prbOIdx) -
|
|
refMol->getConformer().getAtomPos(refSIdx))
|
|
.length();
|
|
TEST_ASSERT(feq(d, distOS[i], 0.1));
|
|
}
|
|
delete refMol;
|
|
delete prbMol;
|
|
}
|
|
|
|
void testCrippenO3AConstraintsAndLocalOnly() {
|
|
std::string rdbase = getenv("RDBASE");
|
|
std::string sdf = rdbase + "/Code/GraphMol/MolAlign/test_data/ref_e2.sdf";
|
|
SDMolSupplier supplier(sdf, true, false);
|
|
const int refNum = 23;
|
|
const int prbNum = 32;
|
|
ROMol *refMol = supplier[refNum];
|
|
ROMol *prbMol = supplier[prbNum];
|
|
MMFF::MMFFMolProperties refMP(*refMol);
|
|
TEST_ASSERT(refMP.isValid());
|
|
MMFF::MMFFMolProperties prbMP(*prbMol);
|
|
TEST_ASSERT(prbMP.isValid());
|
|
RWMol *patt = SmartsToMol("S");
|
|
MatchVectType matchVect;
|
|
TEST_ASSERT(SubstructMatch(*refMol, (ROMol &)*patt, matchVect));
|
|
delete patt;
|
|
unsigned int refSIdx = matchVect[0].second;
|
|
matchVect.clear();
|
|
patt = SmartsToMol("O");
|
|
TEST_ASSERT(SubstructMatch(*prbMol, (ROMol &)*patt, matchVect));
|
|
delete patt;
|
|
unsigned int prbOIdx = matchVect[0].second;
|
|
std::vector<double> distOS(2);
|
|
distOS[0] = 3.2;
|
|
distOS[1] = 0.3;
|
|
std::vector<double> weights(2);
|
|
weights[0] = 10.0;
|
|
weights[1] = 100.0;
|
|
for (unsigned int i = 0; i < 2; ++i) {
|
|
MatchVectType constraintMap;
|
|
constraintMap.push_back(std::make_pair(prbOIdx, refSIdx));
|
|
RDNumeric::DoubleVector constraintWeights(1);
|
|
constraintWeights[0] = weights[i];
|
|
auto *o3a = new MolAlign::O3A(*prbMol, *refMol, &prbMP, &refMP,
|
|
MolAlign::O3A::MMFF94, -1, -1, false, 50, 0,
|
|
&constraintMap, &constraintWeights);
|
|
TEST_ASSERT(o3a);
|
|
o3a->align();
|
|
delete o3a;
|
|
o3a = new MolAlign::O3A(*prbMol, *refMol, &prbMP, &refMP,
|
|
MolAlign::O3A::MMFF94, -1, -1, false, 50,
|
|
MolAlign::O3_LOCAL_ONLY);
|
|
TEST_ASSERT(o3a);
|
|
o3a->align();
|
|
delete o3a;
|
|
double d = (prbMol->getConformer().getAtomPos(prbOIdx) -
|
|
refMol->getConformer().getAtomPos(refSIdx))
|
|
.length();
|
|
TEST_ASSERT(feq(d, distOS[i], 0.1));
|
|
}
|
|
delete prbMol;
|
|
delete refMol;
|
|
}
|
|
|
|
#ifdef RDK_TEST_MULTITHREADED
|
|
namespace {
|
|
void runblock_o3a_mmff(ROMol *refMol, const std::vector<ROMol *> &mols,
|
|
const std::vector<double> &rmsds,
|
|
const std::vector<double> &scores, unsigned int count,
|
|
unsigned int idx) {
|
|
for (unsigned int rep = 0; rep < 10; ++rep) {
|
|
MMFF::MMFFMolProperties refMP(*refMol);
|
|
for (unsigned int i = 0; i < mols.size(); ++i) {
|
|
if (i % count != idx) {
|
|
continue;
|
|
}
|
|
if (!(rep % 10)) {
|
|
BOOST_LOG(rdErrorLog) << "Rep: " << rep << " Mol:" << i << std::endl;
|
|
}
|
|
ROMol prbMol(*mols[i]);
|
|
MMFF::MMFFMolProperties prbMP(prbMol);
|
|
MolAlign::O3A o3a(prbMol, *refMol, &prbMP, &refMP);
|
|
double rmsd = o3a.align();
|
|
double score = o3a.score();
|
|
TEST_ASSERT(feq(rmsd, rmsds[i]));
|
|
TEST_ASSERT(feq(score, scores[i]));
|
|
}
|
|
}
|
|
}
|
|
void runblock_o3a_crippen(ROMol *refMol, const std::vector<ROMol *> &mols,
|
|
const std::vector<double> &rmsds,
|
|
const std::vector<double> &scores, unsigned int count,
|
|
unsigned int idx) {
|
|
ROMol refMolCopy(*refMol);
|
|
for (unsigned int rep = 0; rep < 10; ++rep) {
|
|
unsigned int refNAtoms = refMolCopy.getNumAtoms();
|
|
std::vector<double> refLogpContribs(refNAtoms);
|
|
std::vector<double> refMRContribs(refNAtoms);
|
|
std::vector<unsigned int> refAtomTypes(refNAtoms);
|
|
std::vector<std::string> refAtomTypeLabels(refNAtoms);
|
|
Descriptors::getCrippenAtomContribs(refMolCopy, refLogpContribs,
|
|
refMRContribs, true, &refAtomTypes,
|
|
&refAtomTypeLabels);
|
|
for (unsigned int i = 0; i < mols.size(); ++i) {
|
|
if (i % count != idx) {
|
|
continue;
|
|
}
|
|
if (!(rep % 10)) {
|
|
BOOST_LOG(rdErrorLog) << "Rep: " << rep << " Mol:" << i << std::endl;
|
|
}
|
|
ROMol prbMol(*mols[i]);
|
|
unsigned int prbNAtoms = prbMol.getNumAtoms();
|
|
std::vector<double> prbLogpContribs(prbNAtoms);
|
|
std::vector<double> prbMRContribs(prbNAtoms);
|
|
std::vector<unsigned int> prbAtomTypes(prbNAtoms);
|
|
std::vector<std::string> prbAtomTypeLabels(prbNAtoms);
|
|
Descriptors::getCrippenAtomContribs(prbMol, prbLogpContribs,
|
|
prbMRContribs, true, &prbAtomTypes,
|
|
&prbAtomTypeLabels);
|
|
MolAlign::O3A o3a(prbMol, refMolCopy, &prbLogpContribs, &refLogpContribs,
|
|
MolAlign::O3A::CRIPPEN);
|
|
double rmsd = o3a.align();
|
|
double score = o3a.score();
|
|
TEST_ASSERT(feq(rmsd, rmsds[i]));
|
|
TEST_ASSERT(feq(score, scores[i]));
|
|
}
|
|
}
|
|
}
|
|
} // namespace
|
|
#include <thread>
|
|
#include <future>
|
|
void testMMFFO3AMultiThread() {
|
|
std::string rdbase = getenv("RDBASE");
|
|
std::string sdf = rdbase + "/Code/GraphMol/MolAlign/test_data/ref_e2.sdf";
|
|
|
|
SDMolSupplier suppl(sdf, true, false);
|
|
|
|
std::vector<ROMol *> mols;
|
|
while (!suppl.atEnd() && mols.size() < 100) {
|
|
ROMol *mol = nullptr;
|
|
try {
|
|
mol = suppl.next();
|
|
} catch (...) {
|
|
continue;
|
|
}
|
|
if (!mol) {
|
|
continue;
|
|
}
|
|
mols.push_back(mol);
|
|
}
|
|
|
|
std::cerr << "generating reference data" << std::endl;
|
|
std::vector<double> rmsds(mols.size(), 0.0);
|
|
std::vector<double> scores(mols.size(), 0.0);
|
|
const int refNum = 48;
|
|
ROMol *refMol = mols[refNum];
|
|
MMFF::MMFFMolProperties refMP(*refMol);
|
|
|
|
for (unsigned int i = 0; i < mols.size(); ++i) {
|
|
ROMol prbMol(*mols[i]);
|
|
MMFF::MMFFMolProperties prbMP(prbMol);
|
|
MolAlign::O3A o3a(prbMol, *refMol, &prbMP, &refMP);
|
|
rmsds[i] = o3a.align();
|
|
scores[i] = o3a.score();
|
|
}
|
|
|
|
std::vector<std::future<void>> tg;
|
|
|
|
std::cerr << "processing" << std::endl;
|
|
unsigned int count = 4;
|
|
for (unsigned int i = 0; i < count; ++i) {
|
|
std::cerr << " launch :" << i << std::endl;
|
|
std::cerr.flush();
|
|
tg.emplace_back(std::async(std::launch::async, runblock_o3a_mmff, refMol,
|
|
mols, rmsds, scores, count, i));
|
|
}
|
|
for (auto &fut : tg) {
|
|
fut.get();
|
|
}
|
|
|
|
for (auto &&mol : mols) {
|
|
delete mol;
|
|
}
|
|
BOOST_LOG(rdErrorLog) << " done" << std::endl;
|
|
}
|
|
|
|
void testCrippenO3AMultiThread() {
|
|
std::string rdbase = getenv("RDBASE");
|
|
std::string sdf = rdbase + "/Code/GraphMol/MolAlign/test_data/ref_e2.sdf";
|
|
|
|
SDMolSupplier suppl(sdf, true, false);
|
|
|
|
std::vector<ROMol *> mols;
|
|
while (!suppl.atEnd() && mols.size() < 100) {
|
|
ROMol *mol = nullptr;
|
|
try {
|
|
mol = suppl.next();
|
|
} catch (...) {
|
|
continue;
|
|
}
|
|
if (!mol) {
|
|
continue;
|
|
}
|
|
mols.push_back(mol);
|
|
}
|
|
|
|
std::cerr << "generating reference data" << std::endl;
|
|
std::vector<double> rmsds(mols.size(), 0.0);
|
|
std::vector<double> scores(mols.size(), 0.0);
|
|
const int refNum = 48;
|
|
ROMol *refMol = mols[refNum];
|
|
unsigned int refNAtoms = refMol->getNumAtoms();
|
|
std::vector<double> refLogpContribs(refNAtoms);
|
|
std::vector<double> refMRContribs(refNAtoms);
|
|
std::vector<unsigned int> refAtomTypes(refNAtoms);
|
|
std::vector<std::string> refAtomTypeLabels(refNAtoms);
|
|
Descriptors::getCrippenAtomContribs(*refMol, refLogpContribs, refMRContribs,
|
|
true, &refAtomTypes, &refAtomTypeLabels);
|
|
|
|
for (unsigned int i = 0; i < mols.size(); ++i) {
|
|
ROMol prbMol(*mols[i]);
|
|
unsigned int prbNAtoms = prbMol.getNumAtoms();
|
|
std::vector<double> prbLogpContribs(prbNAtoms);
|
|
std::vector<double> prbMRContribs(prbNAtoms);
|
|
std::vector<unsigned int> prbAtomTypes(prbNAtoms);
|
|
std::vector<std::string> prbAtomTypeLabels(prbNAtoms);
|
|
Descriptors::getCrippenAtomContribs(prbMol, prbLogpContribs, prbMRContribs,
|
|
true, &prbAtomTypes,
|
|
&prbAtomTypeLabels);
|
|
MolAlign::O3A o3a(prbMol, *refMol, &prbLogpContribs, &refLogpContribs,
|
|
MolAlign::O3A::CRIPPEN);
|
|
rmsds[i] = o3a.align();
|
|
scores[i] = o3a.score();
|
|
}
|
|
|
|
std::vector<std::future<void>> tg;
|
|
|
|
std::cerr << "processing" << std::endl;
|
|
unsigned int count = 4;
|
|
for (unsigned int i = 0; i < count; ++i) {
|
|
std::cerr << " launch :" << i << std::endl;
|
|
std::cerr.flush();
|
|
tg.emplace_back(std::async(std::launch::async, runblock_o3a_crippen, refMol,
|
|
mols, rmsds, scores, count, i));
|
|
}
|
|
for (auto &fut : tg) {
|
|
fut.get();
|
|
}
|
|
|
|
for (auto *mol : mols) {
|
|
delete mol;
|
|
}
|
|
BOOST_LOG(rdErrorLog) << " done" << std::endl;
|
|
}
|
|
#endif
|
|
|
|
void testGetO3AForProbeConfs() {
|
|
std::string rdbase = getenv("RDBASE");
|
|
std::string sdf = rdbase + "/Code/GraphMol/MolAlign/test_data/ref_e2.sdf";
|
|
|
|
SDMolSupplier suppl(sdf, true, false);
|
|
ROMol *refMol = suppl[13];
|
|
TEST_ASSERT(refMol);
|
|
|
|
sdf = rdbase + "/Code/GraphMol/MolAlign/test_data/probe_mol.sdf";
|
|
SDMolSupplier psuppl(sdf, true, false);
|
|
ROMol *prbMol = psuppl.next();
|
|
TEST_ASSERT(prbMol);
|
|
while (!psuppl.atEnd()) {
|
|
ROMol *mol = psuppl.next();
|
|
if (!mol) {
|
|
continue;
|
|
}
|
|
auto *conf = new Conformer(mol->getConformer());
|
|
prbMol->addConformer(conf, true);
|
|
delete mol;
|
|
}
|
|
TEST_ASSERT(prbMol->getNumConformers() == 50);
|
|
|
|
MMFF::MMFFMolProperties refMP(*refMol);
|
|
MMFF::MMFFMolProperties prbMP(*prbMol);
|
|
|
|
std::vector<std::pair<double, double>> oscores;
|
|
for (unsigned int i = 0; i < prbMol->getNumConformers(); ++i) {
|
|
MolAlign::O3A o3a(*prbMol, *refMol, &prbMP, &refMP, MolAlign::O3A::MMFF94,
|
|
i);
|
|
double rmsd = o3a.align();
|
|
double score = o3a.score();
|
|
oscores.push_back(std::make_pair(rmsd, score));
|
|
}
|
|
|
|
{
|
|
std::vector<boost::shared_ptr<MolAlign::O3A>> o3s;
|
|
MolAlign::getO3AForProbeConfs(*prbMol, *refMol, &prbMP, &refMP, o3s);
|
|
TEST_ASSERT(o3s.size() == prbMol->getNumConformers());
|
|
for (unsigned int i = 0; i < prbMol->getNumConformers(); ++i) {
|
|
TEST_ASSERT(feq(oscores[i].first, o3s[i]->align()));
|
|
TEST_ASSERT(feq(oscores[i].second, o3s[i]->score()));
|
|
}
|
|
}
|
|
#ifdef RDK_TEST_MULTITHREADED
|
|
{
|
|
ROMol prbMol2(*prbMol);
|
|
unsigned int nDups = 10;
|
|
for (unsigned int j = 0; j < nDups; ++j) {
|
|
for (unsigned int i = 0; i < prbMol->getNumConformers(); ++i) {
|
|
prbMol2.addConformer(new Conformer(prbMol->getConformer(i)), true);
|
|
}
|
|
}
|
|
|
|
std::vector<boost::shared_ptr<MolAlign::O3A>> o3s;
|
|
MolAlign::getO3AForProbeConfs(prbMol2, *refMol, &prbMP, &refMP, o3s, 4);
|
|
TEST_ASSERT(o3s.size() == prbMol2.getNumConformers());
|
|
for (unsigned int i = 0; i < prbMol2.getNumConformers(); ++i) {
|
|
TEST_ASSERT(
|
|
feq(oscores[i % prbMol->getNumConformers()].first, o3s[i]->align()));
|
|
TEST_ASSERT(
|
|
feq(oscores[i % prbMol->getNumConformers()].second, o3s[i]->score()));
|
|
}
|
|
}
|
|
|
|
#endif
|
|
delete refMol;
|
|
delete prbMol;
|
|
|
|
BOOST_LOG(rdErrorLog) << " done" << std::endl;
|
|
}
|
|
|
|
void testO3AMultiThreadBug() {
|
|
std::string rdbase = getenv("RDBASE");
|
|
std::string sdf = rdbase + "/Code/GraphMol/MolAlign/test_data/bzr_data.sdf";
|
|
|
|
SDMolSupplier suppl(sdf, true, false);
|
|
|
|
std::vector<ROMol *> mols;
|
|
while (!suppl.atEnd()) {
|
|
ROMol *mol = suppl.next();
|
|
if (!mol) {
|
|
continue;
|
|
}
|
|
|
|
while (mol->getNumConformers() < 20) {
|
|
auto *conf = new Conformer(mol->getConformer(0));
|
|
mol->addConformer(conf, true);
|
|
}
|
|
mols.push_back(mol);
|
|
}
|
|
TEST_ASSERT(mols.size() == 10);
|
|
|
|
auto *refMol = new ROMol(*mols[0]);
|
|
TEST_ASSERT(refMol);
|
|
|
|
MMFF::MMFFMolProperties refMP(*refMol);
|
|
|
|
#ifdef RDK_TEST_MULTITHREADED
|
|
{
|
|
for (auto &mol : mols) {
|
|
ROMol prbMol = *mol;
|
|
TEST_ASSERT(prbMol.getNumConformers() == 20);
|
|
|
|
MMFF::MMFFMolProperties prbMP(prbMol);
|
|
|
|
std::vector<std::pair<double, double>> oscores;
|
|
for (unsigned int i = 0; i < prbMol.getNumConformers(); ++i) {
|
|
MolAlign::O3A o3a(prbMol, *refMol, &prbMP, &refMP,
|
|
MolAlign::O3A::MMFF94, i);
|
|
double rmsd = o3a.align();
|
|
double score = o3a.score();
|
|
oscores.push_back(std::make_pair(rmsd, score));
|
|
}
|
|
|
|
ROMol prbMol2 = *mol;
|
|
std::vector<boost::shared_ptr<MolAlign::O3A>> o3s;
|
|
MolAlign::getO3AForProbeConfs(prbMol2, *refMol, &prbMP, &refMP, o3s, 0);
|
|
TEST_ASSERT(o3s.size() == prbMol2.getNumConformers());
|
|
for (unsigned int i = 0; i < prbMol2.getNumConformers(); ++i) {
|
|
TEST_ASSERT(
|
|
feq(oscores[i % prbMol.getNumConformers()].first, o3s[i]->align()));
|
|
TEST_ASSERT(feq(oscores[i % prbMol.getNumConformers()].second,
|
|
o3s[i]->score()));
|
|
}
|
|
}
|
|
}
|
|
|
|
#endif
|
|
delete refMol;
|
|
for (auto &&mol : mols) {
|
|
delete mol;
|
|
}
|
|
BOOST_LOG(rdErrorLog) << " done" << std::endl;
|
|
}
|
|
|
|
int main() {
|
|
std::cout << "***********************************************************\n";
|
|
std::cout << "Testing O3AAlign\n";
|
|
|
|
#if 1
|
|
std::cout << "\t---------------------------------\n";
|
|
std::cout << "\t testMMFFO3A \n\n";
|
|
testMMFFO3A();
|
|
|
|
std::cout << "\t---------------------------------\n";
|
|
std::cout << "\t testMMFFO3A with pre-computed dmat and MolHistogram\n\n";
|
|
testMMFFO3AMolHist();
|
|
|
|
std::cout << "\t---------------------------------\n";
|
|
std::cout << "\t testMMFFO3A with constraints\n\n";
|
|
testMMFFO3AConstraints();
|
|
|
|
std::cout << "\t---------------------------------\n";
|
|
std::cout << "\t testMMFFO3A with variable weight constraints followed by "
|
|
"local-only optimization\n\n";
|
|
testMMFFO3AConstraintsAndLocalOnly();
|
|
|
|
std::cout << "\t---------------------------------\n";
|
|
std::cout << "\t testCrippenO3A \n\n";
|
|
testCrippenO3A();
|
|
|
|
std::cout << "\t---------------------------------\n";
|
|
std::cout << "\t testCrippenO3A with pre-computed dmat and MolHistogram\n\n";
|
|
testCrippenO3AMolHist();
|
|
|
|
std::cout << "\t---------------------------------\n";
|
|
std::cout << "\t testCrippenO3A with constraints\n\n";
|
|
testCrippenO3AConstraints();
|
|
|
|
std::cout << "\t---------------------------------\n";
|
|
std::cout << "\t testCrippenO3A with variable weight constraints followed by "
|
|
"local-only optimization\n\n";
|
|
testCrippenO3AConstraintsAndLocalOnly();
|
|
|
|
#ifdef RDK_TEST_MULTITHREADED
|
|
std::cout << "\t---------------------------------\n";
|
|
std::cout << "\t testMMFFO3A multithreading\n\n";
|
|
testMMFFO3AMultiThread();
|
|
|
|
std::cout << "\t---------------------------------\n";
|
|
std::cout << "\t test O3A multithreading bug\n\n";
|
|
testO3AMultiThreadBug();
|
|
#endif
|
|
|
|
#ifdef RDK_TEST_MULTITHREADED
|
|
std::cout << "\t---------------------------------\n";
|
|
std::cout << "\t testCrippenO3A multithreading\n\n";
|
|
testCrippenO3AMultiThread();
|
|
#endif
|
|
|
|
std::cout << "\t---------------------------------\n";
|
|
std::cout << "\t test getO3AForProbeConfs\n\n";
|
|
testGetO3AForProbeConfs();
|
|
#endif
|
|
|
|
std::cout << "***********************************************************\n";
|
|
}
|