Files
rdkit/Code/GraphMol/MolStandardize/AcidBaseCatalog/AcidBaseCatalogUtils.cpp
Greg Landrum ec366c1ab7 Dev/pvs studio cleanups2 (#2877)
* a round of cleanups courtesy of PVS studio

* add a test to make sure that a warning is a false alarm

* bug fix

* Fix a UFF bug

* more PVS studio cleanups

* next round of PVS studio cleanups

* completely remove the chances for that bug

* changes in response to review

* add an additional test
+ a bit of reformatting that snuck in
2020-01-22 15:10:58 +01:00

106 lines
3.0 KiB
C++

//
// Copyright (C) 2018 Susan H. Leung
//
// @@ All Rights Reserved @@
// This file is part of the RDKit.
// The contents are covered by the terms of the BSD license
// which is included in the file license.txt, found at the root
// of the RDKit source tree.
//
#include "AcidBaseCatalogUtils.h"
#include <RDGeneral/BadFileException.h>
#include <GraphMol/SmilesParse/SmilesParse.h>
#include <boost/algorithm/string.hpp>
#include <boost/tokenizer.hpp>
typedef boost::tokenizer<boost::char_separator<char>> tokenizer;
#include <fstream>
#include <string>
namespace RDKit {
namespace {
std::pair<ROMol*, ROMol*>* getPair(const std::string& tmpStr) {
std::pair<ROMol*, ROMol*>* mol_pair = nullptr;
if (tmpStr.length() == 0) {
// empty line
return mol_pair;
}
if (tmpStr.substr(0, 2) == "//") {
// comment line
return mol_pair;
}
boost::char_separator<char> tabSep("\t");
tokenizer tokens(tmpStr, tabSep);
tokenizer::iterator token = tokens.begin();
// name of the functional groups
std::string name = *token;
boost::erase_all(name, " ");
++token;
// grab the acid :
std::string acid_smarts = *token;
boost::erase_all(acid_smarts, " ");
++token;
// grab the base:
std::string base_smarts = *token;
boost::erase_all(base_smarts, " ");
++token;
ROMol* acid(SmartsToMol(acid_smarts));
ROMol* base(SmartsToMol(base_smarts));
CHECK_INVARIANT(acid, acid_smarts);
CHECK_INVARIANT(base, base_smarts);
acid->setProp(common_properties::_Name, name);
base->setProp(common_properties::_Name, name);
mol_pair = new std::pair<ROMol*, ROMol*>(acid, base);
return mol_pair;
}
} // namespace
namespace MolStandardize {
std::vector<std::pair<ROMOL_SPTR, ROMOL_SPTR>> readPairs(std::string fileName) {
std::ifstream inStream(fileName.c_str());
if ((!inStream) || (inStream.bad())) {
std::ostringstream errout;
errout << "Bad input file " << fileName;
throw BadFileException(errout.str());
}
std::vector<std::pair<ROMOL_SPTR, ROMOL_SPTR>> mol_pairs =
readPairs(inStream);
return mol_pairs;
}
std::vector<std::pair<ROMOL_SPTR, ROMOL_SPTR>> readPairs(std::istream& inStream,
int nToRead) {
std::vector<std::pair<ROMOL_SPTR, ROMOL_SPTR>> pairs;
pairs.clear();
if (inStream.bad()) {
throw BadFileException("Bad stream contents.");
}
const int MAX_LINE_LEN = 512;
char inLine[MAX_LINE_LEN];
std::string tmpstr;
int nRead = 0;
while (!inStream.eof() && !inStream.fail() && (nToRead < 0 || nRead < nToRead)) {
inStream.getline(inLine, MAX_LINE_LEN, '\n');
tmpstr = inLine;
// parse the molpair on this line (if there is one)
std::shared_ptr<std::pair<ROMol*, ROMol*>> mol_pair(getPair(tmpstr));
if (mol_pair != nullptr) {
pairs.push_back(std::pair<ROMOL_SPTR, ROMOL_SPTR>(
ROMOL_SPTR(mol_pair->first), ROMOL_SPTR(mol_pair->second)));
nRead++;
}
}
return pairs;
}
} // namespace MolStandardize
} // namespace RDKit