//
//  Copyright (C) 2018 Susan H. Leung
//
//   @@ All Rights Reserved @@
//  This file is part of the RDKit.
//  The contents are covered by the terms of the BSD license
//  which is included in the file license.txt, found at the root
//  of the RDKit source tree.
//
#include "TransformCatalogUtils.h"
#include <RDGeneral/BadFileException.h>
#include <boost/tokenizer.hpp>
#include <GraphMol/SmilesParse/SmilesParse.h>
#include <GraphMol/ChemReactions/ReactionParser.h>
#include <boost/algorithm/string.hpp>
#include <boost/tokenizer.hpp>
typedef boost::tokenizer<boost::char_separator<char>> tokenizer;
#include <fstream>
#include <string>
namespace RDKit {
namespace {
// Parses one line of a transformation definition file.
//
// A data line is tab-separated: <name> TAB <reaction SMARTS> [TAB ...].
// Spaces are removed from both fields; anything after the second field is
// ignored.
//
// Returns nullptr for an empty line or a line starting with "//" (comment).
// Otherwise returns the reaction built by RxnSmartsToChemicalReaction() with
// its _Name property set to the first field. The result is a raw pointer; the
// caller is expected to take ownership of it.
//
// Raises an invariant violation (via CHECK_INVARIANT) when the line has fewer
// than two non-empty tab-separated fields, or when
// RxnSmartsToChemicalReaction() returns a null pointer.
ChemicalReaction *getSmirks(const std::string &tmpStr) {
  if (tmpStr.empty()) {
    // empty line
    return nullptr;
  }
  if (tmpStr.compare(0, 2, "//") == 0) {
    // comment line
    return nullptr;
  }

  // char_separator drops empty tokens by default, so a line without any
  // usable field yields an empty token range; every dereference below is
  // therefore guarded against tokens.end().
  boost::char_separator<char> tabSep("\t");
  tokenizer tokens(tmpStr, tabSep);
  tokenizer::iterator token = tokens.begin();

  // name of the functional groups
  CHECK_INVARIANT(token != tokens.end(),
                  "no name field in transformation line: " + tmpStr);
  std::string name = *token;
  boost::erase_all(name, " ");
  ++token;

  // grab the smirks:
  CHECK_INVARIANT(token != tokens.end(),
                  "no SMIRKS field in transformation line: " + tmpStr);
  std::string smirks = *token;
  boost::erase_all(smirks, " ");

  ChemicalReaction *transformation = RxnSmartsToChemicalReaction(smirks);
  CHECK_INVARIANT(transformation, smirks);
  transformation->setProp(common_properties::_Name, name);
  //  transformation->setProp(common_properties::_SMIRKS, smirks); // TODO
  //  RDGeneral/types.h does not have a common property to use?...
  return transformation;
}
}  // namespace
namespace MolStandardize {
std::vector<std::shared_ptr<ChemicalReaction>> readTransformations(
    std::string fileName) {
  std::ifstream inStream(fileName.c_str());
  if ((!inStream) || (inStream.bad())) {
    std::ostringstream errout;
    errout << "Bad input file " << fileName;
    throw BadFileException(errout.str());
  }
  std::vector<std::shared_ptr<ChemicalReaction>> transformations;
  transformations = readTransformations(inStream);
  return transformations;
}
// Reads transformations from inStream, one definition per line.
//
// Each line is handed to getSmirks(); lines for which it returns nullptr
// (empty lines and "//" comments) are skipped and do not count towards
// nToRead.
//
// inStream: stream to read from. Throws BadFileException if its badbit is
//           already set on entry.
// nToRead:  maximum number of transformations to return; a negative value
//           means "read until the stream is exhausted".
//
// Returns the parsed reactions in file order, each owned by a shared_ptr.
std::vector<std::shared_ptr<ChemicalReaction>> readTransformations(
    std::istream &inStream, int nToRead) {
  if (inStream.bad()) {
    throw BadFileException("Bad stream contents.");
  }

  std::vector<std::shared_ptr<ChemicalReaction>> transformations;
  std::string line;
  int nRead = 0;
  // std::getline into a std::string has no fixed line-length limit. A
  // fixed-size char buffer would set failbit on an over-long line, which
  // truncates that line and silently ends the read.
  while ((nToRead < 0 || nRead < nToRead) && std::getline(inStream, line)) {
    // Tolerate CRLF line endings: a trailing '\r' is never part of the data.
    if (!line.empty() && line.back() == '\r') {
      line.pop_back();
    }
    // parse the reaction on this line (if there is one)
    std::shared_ptr<ChemicalReaction> transformation(getSmirks(line));
    if (transformation) {
      transformations.push_back(transformation);
      ++nRead;
    }
  }
  return transformations;
}
}  // namespace MolStandardize
}  // namespace RDKit