// Source listing: rdkit/Code/DataStructs/testFPB.cpp
// Snapshot dated 2016-01-12 12:09:53 +01:00 (131 lines, 4.2 KiB, C++)

//
// Copyright (C) 2015 Greg Landrum
//
// @@ All Rights Reserved @@
// This file is part of the RDKit.
// The contents are covered by the terms of the BSD license
// which is included in the file license.txt, found at the root
// of the RDKit source tree.
//
#include <RDGeneral/Invariant.h>
#include <RDGeneral/RDLog.h>
#include <RDGeneral/Exceptions.h>
#include <RDGeneral/utils.h>
#include <DataStructs/ExplicitBitVect.h>
#include <DataStructs/FPBReader.h>
using namespace RDKit;
void test1FPBReaderBasics() {
BOOST_LOG(rdInfoLog) << "-----------------------\n Testing FPBReader basics "
<< std::endl;
std::string pathName = getenv("RDBASE");
pathName += "/Code/DataStructs/testData/";
{
std::string filename = pathName + "zim.head100.fpb";
FPBReader fps(filename);
fps.init();
TEST_ASSERT(fps.length() == 100);
{ // pop counts
std::pair<unsigned int, unsigned int> offsets;
offsets = fps.getFPIdsInCountRange(17, 17);
TEST_ASSERT(offsets.first == 0);
TEST_ASSERT(offsets.second == 1);
offsets = fps.getFPIdsInCountRange(60, 65);
TEST_ASSERT(offsets.first == 96);
TEST_ASSERT(offsets.second == 100);
offsets = fps.getFPIdsInCountRange(160, 165);
TEST_ASSERT(offsets.first == 100);
TEST_ASSERT(offsets.second == 100);
}
{ // get* version
std::string nm = fps.getId(0);
TEST_ASSERT(nm == "ZINC00902219");
ExplicitBitVect *fp = fps.getFP(0);
TEST_ASSERT(fp);
TEST_ASSERT(fp->getNumBits() == 2048);
TEST_ASSERT(fp->getNumOnBits() == 17);
unsigned int obs[17] = {1, 80, 183, 222, 227, 231, 482, 650, 807,
811, 831, 888, 1335, 1411, 1664, 1820, 1917};
for (unsigned int i = 0; i < fp->getNumOnBits(); ++i) {
TEST_ASSERT(fp->getBit(obs[i]));
}
delete fp;
}
{ // operator[] version
std::pair<ExplicitBitVect *, std::string> tpl = fps[0];
ExplicitBitVect *fp = tpl.first;
TEST_ASSERT(fp);
TEST_ASSERT(fp->getNumBits() == 2048);
TEST_ASSERT(fp->getNumOnBits() == 17);
unsigned int obs[17] = {1, 80, 183, 222, 227, 231, 482, 650, 807,
811, 831, 888, 1335, 1411, 1664, 1820, 1917};
for (unsigned int i = 0; i < fp->getNumOnBits(); ++i) {
TEST_ASSERT(fp->getBit(obs[i]));
}
delete fp;
TEST_ASSERT(tpl.second == "ZINC00902219");
}
{ // test another fp
ExplicitBitVect *fp = fps.getFP(3);
TEST_ASSERT(fp);
TEST_ASSERT(fp->getNumBits() == 2048);
TEST_ASSERT(fp->getNumOnBits() == 20);
unsigned int obs[20] = {1, 8, 80, 95, 222, 227, 457,
482, 650, 680, 715, 807, 831, 845,
888, 1226, 1556, 1711, 1917, 1982};
for (unsigned int i = 0; i < fp->getNumOnBits(); ++i) {
TEST_ASSERT(fp->getBit(obs[i]));
}
delete fp;
std::string nm = fps.getId(3);
TEST_ASSERT(nm == "ZINC04803506");
}
}
BOOST_LOG(rdInfoLog) << "Finished" << std::endl;
}
// Exercises FPBReader::getTanimoto() against the zim.head100.fpb test file,
// using raw fingerprint bytes obtained from FPBReader::getBytes() as queries.
//
// The test data is located relative to the RDBASE environment variable; the
// test fails with a TEST_ASSERT if that variable is not set.
void test2FPBReaderTanimoto() {
  BOOST_LOG(rdInfoLog)
      << "-----------------------\n Testing FPBReader tanimoto " << std::endl;
  // getenv() returns a null pointer when the variable is missing, and
  // constructing a std::string from a null pointer is undefined behaviour,
  // so check before building the path.
  const char *rdbase = getenv("RDBASE");
  TEST_ASSERT(rdbase);
  std::string pathName = rdbase;
  pathName += "/Code/DataStructs/testData/";
  {
    std::string filename = pathName + "zim.head100.fpb";
    FPBReader fps(filename);
    fps.init();
    TEST_ASSERT(fps.length() == 100);
    {
      // query with the bytes of fingerprint 0
      boost::uint8_t *bytes = fps.getBytes(0);
      TEST_ASSERT(bytes);
      // comparing a fingerprint with its own bytes must give 1.0
      TEST_ASSERT(feq(fps.getTanimoto(0, bytes), 1.0));
      TEST_ASSERT(feq(fps.getTanimoto(1, bytes), 0.3703));
      // the test releases the buffer from getBytes() with delete[]
      delete[] bytes;
    }
    {
      // query with the bytes of fingerprint 1
      boost::uint8_t *bytes = fps.getBytes(1);
      TEST_ASSERT(bytes);
      TEST_ASSERT(feq(fps.getTanimoto(1, bytes), 1.0));
      // same expected value as the (1, bytes-of-0) comparison above
      TEST_ASSERT(feq(fps.getTanimoto(0, bytes), 0.3703));
      // NOTE(review): a similarity of 1.0 here implies fingerprints 1 and 2
      // are identical in the test file - confirm against the data
      TEST_ASSERT(feq(fps.getTanimoto(2, bytes), 1.0));
      TEST_ASSERT(feq(fps.getTanimoto(5, bytes), 0.2903));
      delete[] bytes;
    }
  }
  BOOST_LOG(rdInfoLog) << "Finished" << std::endl;
}
// Test driver: initializes the RDKit loggers, then runs each FPBReader test
// in sequence.
int main() {
  // logging must be set up before the tests write to rdInfoLog
  RDLog::InitLogs();

  test1FPBReaderBasics();
  test2FPBReaderTanimoto();

  // TODO: add a test for extractBytes()
  // TODO: add tests covering edge cases
  return 0;
}