File: test_alignment_fiddling.py

package info (click to toggle)
promod3 3.2.1+ds-6
  • links: PTS, VCS
  • area: main
  • in suites: bookworm
  • size: 1,033,844 kB
  • sloc: cpp: 55,507; python: 17,487; makefile: 84; sh: 51
file content (129 lines) | stat: -rw-r--r-- 6,349 bytes parent folder | download | duplicates (3)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
# Copyright (c) 2013-2020, SIB - Swiss Institute of Bioinformatics and
#                          Biozentrum - University of Basel
# 
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
# 
#   http://www.apache.org/licenses/LICENSE-2.0
# 
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.


"""
Unit tests for alignment fiddling.
"""
import unittest
from promod3 import modelling
from ost import seq, io

class ModellingTests(unittest.TestCase):
    """Unit tests for ``modelling.DeleteGapCols`` and
    ``modelling.PullTerminalDeletions``.

    All input files are loaded from the ``data/`` directory relative to the
    current working directory.
    """

    def _BuildAnnotatedAln(self, aln, offsets):
        """Rebuild the first ``len(offsets)`` sequences of *aln* with metadata.

        Every rebuilt sequence keeps the name and the raw string of the
        original one, gets the corresponding entry of *offsets* as offset and
        a full view of the structure in ``data/1CRN.pdb`` attached. The
        structure is unrelated to the sequences; it only serves to have
        *some* view attached.

        :param aln: Alignment to take names and sequence strings from.
        :param offsets: One offset per sequence to rebuild.
        :returns: Tuple ``(sequences, alignment)`` with the list of rebuilt
                  sequences and a new alignment containing them in order.
        """
        random_structure = io.LoadPDB('data/1CRN.pdb')
        sequences = []
        annotated_aln = seq.CreateAlignment()
        for idx, offset in enumerate(offsets):
            orig = aln.GetSequence(idx)
            s = seq.CreateSequence(orig.GetName(), str(orig))
            s.SetOffset(offset)
            s.AttachView(random_structure.CreateFullView())
            annotated_aln.AddSequence(s)
            sequences.append(s)
        return sequences, annotated_aln

    def _AssertMetadataPreserved(self, sequences, processed_aln):
        """Check that *processed_aln* kept the metadata of *sequences*.

        For every sequence in *sequences*, the sequence at the same index in
        *processed_aln* must have the same name, the same offset and an
        attached view.
        """
        for idx, s in enumerate(sequences):
            processed = processed_aln.GetSequence(idx)
            self.assertEqual(s.GetName(), processed.GetName())
            self.assertEqual(s.GetOffset(), processed.GetOffset())
            self.assertTrue(processed.HasAttachedView())

    def testDeleteGapCols(self):
        """DeleteGapCols yields the expected sequences and keeps metadata."""
        aln = io.LoadAlignment('data/double_gap_aln.fasta')
        # recreate aln with added offsets and attach some random structure to
        # both sequences
        sequences, pimped_aln = self._BuildAnnotatedAln(aln, (1, 2))
        processed_aln = modelling.DeleteGapCols(pimped_aln)

        # name, offset and attached view must survive the processing
        self._AssertMetadataPreserved(sequences, processed_aln)

        # the actual sequences changed and are checked with the expected outcome
        self.assertEqual(str(processed_aln.GetSequence(0)), 'ABCDEFG-H--I')
        self.assertEqual(str(processed_aln.GetSequence(1)), 'ABCDEFGHIJKL')

    def testPullTerminalDeletions(self):
        """PullTerminalDeletions validates its anchor size, yields the
        expected alignments and keeps metadata."""
        aln = io.LoadAlignment('data/terminal_deletion_aln.fasta')

        # min_terminal_anchor_sizes which are <= 0 are disallowed
        for invalid_size in (-10, 0):
            with self.subTest(min_terminal_anchor_size=invalid_size):
                self.assertRaises(RuntimeError,
                                  modelling.PullTerminalDeletions,
                                  aln, invalid_size)

        # check expected results for different min_terminal_anchor_sizes

        # nothing should happen for anchor size 1
        processed_aln = modelling.PullTerminalDeletions(aln, 1)
        self.assertEqual(str(aln.GetSequence(0)), str(processed_aln.GetSequence(0)))
        self.assertEqual(str(aln.GetSequence(1)), str(processed_aln.GetSequence(1)))

        # the second sequence is expected to be the same for all anchor sizes
        # tested below, only the first one differs
        exp_s1 = '-----DAQDKLKYLVKQLERALRELKKSLDELERSLEELEKNPSEDALVENNRLNVENNKIIVEVLRIILE-------------------------------------------'
        expected_s0 = (
            (2, 'GSHMG----DLK--------------YSLERLREILERLEENPSEKQIVEAIRAIVENNAQIVE--AAIE-NNAQIVENNRAIIEALEAIGVDQKILEEMKKQLKDLKRSLERG'),
            (3, 'GSHMG----DLK--------------YSLERLREILERLEENPSEKQIVEAIRAIVENNAQIVE--AAIE-NNAQIVENNRAIIEALEAIGVDQKILEEMKKQLKDLKRSLERG'),
            (4, 'GSHMG------------------DLKYSLERLREILERLEENPSEKQIVEAIRAIVENNAQIVE--AAIE-NNAQIVENNRAIIEALEAIGVDQKILEEMKKQLKDLKRSLERG'),
            (5, 'GSHMG------------------DLKYSLERLREILERLEENPSEKQIVEAIRAIVENNAQIVEAAIE---NNAQIVENNRAIIEALEAIGVDQKILEEMKKQLKDLKRSLERG'),
        )
        for anchor_size, exp_s0 in expected_s0:
            # subTest reports the failing anchor size and keeps checking the
            # remaining ones
            with self.subTest(min_terminal_anchor_size=anchor_size):
                processed_aln = modelling.PullTerminalDeletions(aln, anchor_size)
                self.assertEqual(str(processed_aln.GetSequence(0)), exp_s0)
                self.assertEqual(str(processed_aln.GetSequence(1)), exp_s1)

        # also check, whether sequence name, offsets and attached views are
        # preserved; non-default offsets are set so that the offset comparison
        # cannot pass by accident when offsets get dropped
        sequences, pimped_aln = self._BuildAnnotatedAln(aln, (1, 2))
        processed_aln = modelling.PullTerminalDeletions(pimped_aln, 5)
        self._AssertMetadataPreserved(sequences, processed_aln)


if __name__ == "__main__":
    # Executed as a script: hand over to the test runner shipped with ost.
    from ost.testutils import RunTests
    RunTests()