File: testMolProcessing.py

package info (click to toggle)
rdkit 202503.1-5
  • links: PTS, VCS
  • area: main
  • in suites: forky, sid
  • size: 220,160 kB
  • sloc: cpp: 399,240; python: 77,453; ansic: 25,517; java: 8,173; javascript: 4,005; sql: 2,389; yacc: 1,565; lex: 1,263; cs: 1,081; makefile: 580; xml: 229; fortran: 183; sh: 105
file content (56 lines) | stat: -rw-r--r-- 2,079 bytes parent folder | download | duplicates (2)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
#
#  Copyright (C) 2024 Greg Landrum and other RDKit contributors
#   @@ All Rights Reserved @@
#
#  This file is part of the RDKit.
#  The contents are covered by the terms of the BSD license
#  which is included in the file license.txt, found at the root
#  of the RDKit source tree.

import unittest

#
from rdkit import Chem
from rdkit.Chem import rdMolProcessing
from rdkit.Chem import rdFingerprintGenerator
from rdkit import DataStructs
from rdkit import RDConfig


class TestCase(unittest.TestCase):
  """Tests for rdMolProcessing.GetFingerprintsForMolsInFile()."""

  def setUp(self):
    """Store the paths of the SMILES and SD input files used by the tests."""
    self.smiFile = RDConfig.RDBaseDir + '/Regress/Data/zinc.leads.500.q.smi'
    self.sdFile = RDConfig.RDBaseDir + "/Data/NCI/first_200.props.sdf"

  def _assertMatchesSmilesSupplier(self, fps, fpg):
    """Cross-check the first two entries of fps against the SMILES file.

    The first two molecules are read from self.smiFile with a
    SmilesMolSupplier and fingerprinted with fpg; the Tanimoto similarity of
    that pair must equal the similarity of fps[0] and fps[1].

    Arguments:
      - fps: the fingerprints returned by GetFingerprintsForMolsInFile()
        for self.smiFile
      - fpg: the fingerprint generator used to build the reference pair
    """
    # only the first two molecules take part in the comparison
    with Chem.SmilesMolSupplier(self.smiFile, delimiter='\t') as suppl:
      mols = [next(suppl) for _ in range(2)]
    expected = [fpg.GetFingerprint(m) for m in mols]
    self.assertEqual(DataStructs.TanimotoSimilarity(fps[0], fps[1]),
                     DataStructs.TanimotoSimilarity(expected[0], expected[1]))

  def test1(self):
    """Fingerprints from a SMILES file and an SD file with no generator given."""
    fps = rdMolProcessing.GetFingerprintsForMolsInFile(self.smiFile)
    self.assertEqual(len(fps), 499)
    # without an explicit generator the results are required to agree with
    # fingerprints from a Morgan generator built with its default arguments
    self._assertMatchesSmilesSupplier(fps, rdFingerprintGenerator.GetMorganGenerator())

    fps = rdMolProcessing.GetFingerprintsForMolsInFile(self.sdFile)
    self.assertEqual(len(fps), 200)
    # the SD file result is checked against a pinned similarity value
    self.assertAlmostEqual(DataStructs.TanimotoSimilarity(fps[0], fps[1]), 0.0638, places=3)

  def test2(self):
    """Fingerprints from a SMILES file using an explicitly provided generator."""
    fpg = rdFingerprintGenerator.GetMorganGenerator(radius=2)

    fps = rdMolProcessing.GetFingerprintsForMolsInFile(self.smiFile, generator=fpg)
    self.assertEqual(len(fps), 499)
    self._assertMatchesSmilesSupplier(fps, fpg)


# Run every test in this module when the file is executed as a script.
if __name__ == '__main__':  # pragma: nocover
  unittest.main()