1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97
|
//
// Copyright (C) 2018 Susan H. Leung
//
// @@ All Rights Reserved @@
// This file is part of the RDKit.
// The contents are covered by the terms of the BSD license
// which is included in the file license.txt, found at the root
// of the RDKit source tree.
//
#include "TransformCatalogUtils.h"
#include <RDGeneral/BadFileException.h>
#include <boost/tokenizer.hpp>
#include <GraphMol/SmilesParse/SmilesParse.h>
#include <GraphMol/ChemReactions/ReactionParser.h>
#include <boost/algorithm/string.hpp>
#include <boost/tokenizer.hpp>
typedef boost::tokenizer<boost::char_separator<char>> tokenizer;
#include <fstream>
#include <string>
namespace RDKit {
namespace {
ChemicalReaction *getSmirks(const std::string &tmpStr) {
ChemicalReaction *transformation = nullptr;
if (tmpStr.length() == 0) {
// empty line
return transformation;
}
if (tmpStr.substr(0, 2) == "//") {
// comment line
return transformation;
}
boost::char_separator<char> tabSep("\t");
tokenizer tokens(tmpStr, tabSep);
tokenizer::iterator token = tokens.begin();
// name of the functional groups
std::string name = *token;
boost::erase_all(name, " ");
++token;
// grab the smirks:
std::string smirks = *token;
boost::erase_all(smirks, " ");
++token;
transformation = RxnSmartsToChemicalReaction(smirks);
CHECK_INVARIANT(transformation, smirks);
transformation->setProp(common_properties::_Name, name);
// transformation->setProp(common_properties::_SMIRKS, smirks); // TODO
// RDGeneral/types.h does not have a common property to use?...
return transformation;
}
} // namespace
namespace MolStandardize {
std::vector<std::shared_ptr<ChemicalReaction>> readTransformations(
std::string fileName) {
std::ifstream inStream(fileName.c_str());
if ((!inStream) || (inStream.bad())) {
std::ostringstream errout;
errout << "Bad input file " << fileName;
throw BadFileException(errout.str());
}
std::vector<std::shared_ptr<ChemicalReaction>> transformations;
transformations = readTransformations(inStream);
return transformations;
}
std::vector<std::shared_ptr<ChemicalReaction>> readTransformations(
std::istream &inStream, int nToRead) {
std::vector<std::shared_ptr<ChemicalReaction>> transformations;
transformations.clear();
if (inStream.bad()) {
throw BadFileException("Bad stream contents.");
}
const int MAX_LINE_LEN = 512;
char inLine[MAX_LINE_LEN];
std::string tmpstr;
int nRead = 0;
while (!inStream.eof() && (nToRead < 0 || nRead < nToRead)) {
inStream.getline(inLine, MAX_LINE_LEN, '\n');
tmpstr = inLine;
// parse the reaction on this line (if there is one)
std::shared_ptr<ChemicalReaction> transformation(getSmirks(tmpstr));
if (transformation) {
transformations.push_back(transformation);
nRead++;
}
}
return transformations;
}
} // namespace MolStandardize
} // namespace RDKit
|