File: test_nbrf_io.py

package info (click to toggle)
python-weblogo 3.8.0-2
  • links: PTS, VCS
  • area: main
  • in suites: sid, trixie
  • size: 3,700 kB
  • sloc: xml: 14,455; python: 10,384; sh: 140; makefile: 58
file content (125 lines) | stat: -rwxr-xr-x 4,929 bytes parent folder | download | duplicates (2)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
#!/usr/bin/env python

#  Copyright (c) 2006, The Regents of the University of California, through
#  Lawrence Berkeley National Laboratory (subject to receipt of any required
#  approvals from the U.S. Dept. of Energy).  All rights reserved.

#  This software is distributed under the new BSD Open Source License.
#  <http://www.opensource.org/licenses/bsd-license.html>
#
#  Redistribution and use in source and binary forms, with or without
#  modification, are permitted provided that the following conditions are met:
#
#  (1) Redistributions of source code must retain the above copyright notice,
#  this list of conditions and the following disclaimer.
#
#  (2) Redistributions in binary form must reproduce the above copyright
#  notice, this list of conditions and the following disclaimer in the
#  documentation and or other materials provided with the distribution.
#
#  (3) Neither the name of the University of California, Lawrence Berkeley
#  National Laboratory, U.S. Dept. of Energy nor the names of its contributors
#  may be used to endorse or promote products derived from this software
#  without specific prior written permission.
#
#  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
#  AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
#  IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
#  ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
#  LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
#  CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
#  SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
#  INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
#  CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
#  ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
#  POSSIBILITY OF SUCH DAMAGE.

import unittest
from io import StringIO

from weblogo.seq import dna_alphabet, protein_alphabet
from weblogo.seq_io import clustal_io, nbrf_io, plain_io

from . import data_stream


class test_nbrf_io(unittest.TestCase):
    def test_parse_cox2(self) -> None:
        f = data_stream("cox2.nbrf")
        seqs = nbrf_io.read(f)
        self.assertEqual(len(seqs), 5)
        self.assertEqual(len(seqs[1]), 210)
        self.assertEqual(
            str(seqs[0]),
            "MAFILSFWMIFLLDSVIVLLSFVCFVCVWICALLFSTVLLVSKLNNIYCTWDFTASKFIDVYWFTIGGMFSLG"
            "LLLRLCLLLYFGHLNFVSFDLCKVVGFQWYWVYFIFGETTIFSNLILESDYMIGDLRLLQCNHVLTLLSLVIY"
            "KLWLSAVDVIHSFAISSLGVKVENLVAVMK",
        )
        self.assertEqual(seqs[0].alphabet, protein_alphabet)
        f.close()

    def test_parse_crab(self) -> None:
        f = data_stream("crab.nbrf")
        seqs = nbrf_io.read(f)
        self.assertEqual(seqs[0].alphabet, protein_alphabet)
        self.assertEqual(len(seqs), 9)
        self.assertEqual(seqs[2].name, "CRAB_CHICK")
        self.assertEqual(
            seqs[2].description, "ALPHA CRYSTALLIN B CHAIN (ALPHA(B)-CRYSTALLIN)."
        )
        f.close()

    def test_parse_dna(self) -> None:
        f = data_stream("dna.pir")
        seqs = nbrf_io.read(f)
        self.assertEqual(seqs[0].alphabet, dna_alphabet)
        self.assertEqual(len(seqs), 10)
        f.close()

    def test_parse_examples(self) -> None:
        f = data_stream("rhod.pir")
        seqs = nbrf_io.read(f)
        self.assertEqual(seqs[0].alphabet, protein_alphabet)
        self.assertEqual(len(seqs), 3)
        f.close()

    def test_parse_protein(self) -> None:
        f = data_stream("protein.pir")
        seqs = nbrf_io.read(f)
        self.assertEqual(seqs[0].alphabet, protein_alphabet)
        self.assertEqual(len(seqs), 10)
        f.close()

    def test_parse_clustal_fail(self) -> None:
        # should fail with parse error
        f = StringIO(clustal_io.example)
        self.assertRaises(ValueError, nbrf_io.read, f, protein_alphabet)

    def test_parse_plain_fail(self) -> None:
        # should fail with parse error
        f = StringIO(plain_io.example)
        self.assertRaises(ValueError, nbrf_io.read, f)

    def test_pir_file_from_clustal(self) -> None:
        f = data_stream("clustalw.pir")
        seqs = nbrf_io.read(f)
        self.assertEqual(len(seqs), 2)
        self.assertEqual(
            seqs[1].endswith(
                "C-AATC-G-CAATG-G--CTTGAACCGGGTAAAAGTCGT-A----------------------------------------"
                "-----------------------------------------"
            ),
            True,
        )
        f.close()

    def test_parse_examples_alphabet(self) -> None:
        f = data_stream("rhod.pir")
        seqs = nbrf_io.read(f, alphabet=protein_alphabet)
        self.assertEqual(seqs[0].alphabet, protein_alphabet)
        self.assertEqual(len(seqs), 3)
        f.close()


if __name__ == "__main__":
    unittest.main()