File: MaximumCommonSubgraph.h

package info (click to toggle)
rdkit 202503.1-5
  • links: PTS, VCS
  • area: main
  • in suites: forky, sid
  • size: 220,160 kB
  • sloc: cpp: 399,240; python: 77,453; ansic: 25,517; java: 8,173; javascript: 4,005; sql: 2,389; yacc: 1,565; lex: 1,263; cs: 1,081; makefile: 580; xml: 229; fortran: 183; sh: 105
file content (106 lines) | stat: -rw-r--r-- 3,485 bytes parent folder | download | duplicates (2)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
//
//  Copyright (C) 2014 Novartis Institutes for BioMedical Research
//
//   @@ All Rights Reserved @@
//  This file is part of the RDKit.
//  The contents are covered by the terms of the BSD license
//  which is included in the file license.txt, found at the root
//  of the RDKit source tree.
//
#include <RDGeneral/export.h>
#pragma once
#include <cstddef>
#include <cstdint>
#include <map>
#include <stdexcept>
#include <string>
#include <utility>
#include <vector>
#include "../RDKitBase.h"
#include "FMCS.h"
#include "DebugTrace.h"  // algorithm filter definitions
#include "SeedSet.h"
#include "Target.h"
#include "SubstructureCache.h"
#include "DuplicatedSeedCache.h"
#include "MatchTable.h"
#include "TargetMatch.h"

namespace RDKit {

// Declaration of the final chirality check; no definition is provided in this
// header.
//
// Parameters (as declared):
//   c1, c2  - arrays of 32-bit unsigned values; presumably the matched
//             atom/vertex indices for the query and the target respectively
//             -- TODO confirm against the definition.
//   mol1    - first molecule, paired with the graph `query`.
//   query   - FMCS graph associated with mol1.
//   mol2    - second molecule, paired with the graph `target`.
//   target  - FMCS graph associated with mol2.
//   p       - pointer to the MCS parameters in effect.
// Returns a bool; presumably true when the match passes the check -- TODO
// confirm.
//
// NOTE(review): the function is declared `inline` but is only declared here.
// An inline function must be defined in every translation unit that odr-uses
// it, so confirm that a definition is visible wherever this is called or has
// its address taken.
inline bool FinalChiralityCheckFunction(
    const std::uint32_t c1[], const std::uint32_t c2[], const ROMol &mol1,
    const FMCS::Graph &query, const ROMol &mol2, const FMCS::Graph &target,
    const MCSParameters *p);

// Declaration of the final match check; the definition lives outside this
// header.
//
// Parameters (as declared):
//   c1, c2  - arrays of 32-bit unsigned values; presumably the matched
//             atom/vertex indices for the query and the target respectively
//             -- TODO confirm against the definition.
//   mol1    - first molecule, paired with the graph `query`.
//   query   - FMCS graph associated with mol1.
//   mol2    - second molecule, paired with the graph `target`.
//   target  - FMCS graph associated with mol2.
//   p       - pointer to the MCS parameters in effect.
// Returns a bool; presumably true when the candidate match is accepted --
// TODO confirm.
bool FinalMatchCheckFunction(const std::uint32_t c1[], const std::uint32_t c2[],
                             const ROMol &mol1, const FMCS::Graph &query,
                             const ROMol &mol2, const FMCS::Graph &target,
                             const MCSParameters *p);

namespace FMCS {
//! State holder and entry point for a maximum common subgraph search.
/*!
  The search is started with find(), which takes the input molecules and
  returns an MCSResult. The remaining public members expose the current
  query molecule, the size of the current result and the parameters, and
  provide the seed matching hooks checkIfMatchAndAppend() / match().

  All scalar and raw-pointer data members carry default member initializers
  so that no member is ever read with an indeterminate value, regardless of
  what the out-of-line constructor assigns. Member order is significant
  (it fixes layout and initialization order) and must not be changed.
*/
class RDKIT_FMCS_EXPORT MaximumCommonSubgraph {
  // current result. Reference to a fragment of source molecule
  struct MCS {
    std::vector<const Atom *> Atoms;
    std::vector<const Bond *> Bonds;
    // non-owning; null until a result has been recorded
    const ROMol *QueryMolecule = nullptr;
    std::vector<Target> Targets;
  };
  // timestamp taken from nanoClock() in clear()
  // NOTE(review): presumably the reference point for the timeout -- confirm
  unsigned long long To = 0;
  MCSProgressData Stat;
  detail::MCSParametersInternal Parameters;
  // min number of matches
  unsigned int ThresholdCount = 0;
  // non-owning pointers to the input molecules
  std::vector<const ROMol *> Molecules;
#ifdef FAST_SUBSTRUCT_CACHE
  // for Morgan code. Value based on current functor and parameters
  std::vector<unsigned int> QueryAtomLabels;
  // for Morgan code. Value based on current functor and parameters
  std::vector<unsigned int> QueryBondLabels;
  SubstructureCache HashCache;
  MatchTable QueryAtomMatchTable;
  MatchTable QueryBondMatchTable;
#endif
#ifdef DUP_SUBSTRUCT_CACHE
  DuplicatedSeedCache DuplicateCache;
#endif
  // non-owning; null until a query molecule has been selected
  const ROMol *QueryMolecule = nullptr;
  unsigned int QueryMoleculeMatchedBonds = 0;
  unsigned int QueryMoleculeMatchedAtoms = 0;
  const Atom *QueryMoleculeSingleMatchedAtom = nullptr;
  std::vector<Target> Targets;
  SeedSet Seeds;
  MCS McsIdx;
  std::map<std::vector<unsigned int>, MCS> DegenerateMcsMap;

 public:
#ifdef VERBOSE_STATISTICS_ON
  ExecStatistics VerboseStatistics;
#endif

  //! Constructs the search object from a pointer to the caller's parameters.
  MaximumCommonSubgraph(const MCSParameters *params);
  //! Releases the target and molecule lists via clear().
  ~MaximumCommonSubgraph() { clear(); }
  //! Runs the search over \c mols and returns the result.
  MCSResult find(const std::vector<ROMOL_SPTR> &mols);
  //! Returns the current query molecule.
  /*! QueryMolecule is dereferenced unconditionally, so this must only be
      called once a query molecule has been set (it is null beforehand). */
  const ROMol &getQueryMolecule() const { return *QueryMolecule; }
  //! Number of bonds in the current result (McsIdx).
  unsigned int getMaxNumberBonds() const {
    // explicit narrowing: the container size is size_t, the API is unsigned
    return static_cast<unsigned int>(McsIdx.Bonds.size());
  }

  //! Number of atoms in the current result (McsIdx).
  unsigned int getMaxNumberAtoms() const {
    return static_cast<unsigned int>(McsIdx.Atoms.size());
  }
  bool checkIfMatchAndAppend(Seed &seed);
  bool match(Seed &seed);
  //! Read-only access to the parameters used by this search.
  const MCSParameters &parameters() const { return Parameters; }
  //! Mutable access to the parameters used by this search.
  MCSParameters &parameters() { return Parameters; }

 private:
  // Drops the per-search target and molecule lists and re-reads the clock.
  // Also invoked from the destructor.
  void clear() {
    Targets.clear();
    Molecules.clear();
    To = nanoClock();
  }
  void init(size_t startIdx);
  void makeInitialSeeds();
  bool createSeedFromMCS(size_t newQueryTarget, Seed &seed);
  bool growSeeds();  // returns false if canceled
  std::pair<std::string, ROMOL_SPTR> generateResultSMARTSAndQueryMol(
      const MCS &mcsIdx) const;

  bool matchIncrementalFast(Seed &seed, unsigned int itarget);
};
}  // namespace FMCS
}  // namespace RDKit