File: MotifToolsTest.java

package info (click to toggle)
biojava-live 1%3A1.7.1-8
  • links: PTS, VCS
  • area: main
  • in suites: buster
  • size: 55,160 kB
  • sloc: java: 180,820; xml: 6,908; sql: 510; makefile: 50
file content (142 lines) | stat: -rw-r--r-- 3,641 bytes parent folder | download | duplicates (7)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
/*
 *                    BioJava development code
 *
 * This code may be freely distributed and modified under the
 * terms of the GNU Lesser General Public Licence.  This should
 * be distributed with the code.  If you do not have a copy,
 * see:
 *
 *      http://www.gnu.org/copyleft/lesser.html
 *
 * Copyright for this code is held jointly by the individual
 * authors.  These should be listed in @author doc comments.
 *
 * For more information on the BioJava project and its aims,
 * or to join the biojava-l mailing list, visit the home page
 * at:
 *
 *      http://www.biojava.org/
 *
 */

package org.biojava.bio.symbol;

import java.util.ArrayList;
import java.util.Arrays;
import java.util.Iterator;
import java.util.List;
import java.util.Set;

import junit.framework.TestCase;

import org.biojava.bio.seq.DNATools;
import org.biojava.bio.seq.io.SymbolTokenization;
import org.biojava.utils.AssertionFailure;

/**
 * JUnit tests for {@code MotifTools.createRegex}, comparing the regular
 * expression text it produces for short DNA sequences against the
 * expected pattern strings.
 */
public class MotifToolsTest
    extends TestCase {

    /**
     * Expected regex fragment for the symbol returned by
     * {@code DNATools.n()}: the sorted single-character tokens of its
     * non-gap symbols wrapped in square brackets. Assigned by
     * {@link #setUp()}.
     */
    protected String n;

    /**
     * Creates the test case.
     *
     * @param name name passed through to the {@code TestCase} constructor
     */
    public MotifToolsTest(String name) {
        super(name);
    }

    /**
     * Computes {@link #n} before each test. Any exception raised while
     * doing so is rethrown wrapped in an {@code AssertionFailure}.
     */
    protected void setUp() {
        try {
            n = buildAmbiguityClass();
        } catch (Exception e) {
            throw new AssertionFailure("Couldn't initialize motif tools test", e);
        }
    }

    /**
     * Builds the bracketed character class expected for
     * {@code DNATools.n()}.
     *
     * @return "[" followed by the sorted symbol tokens followed by "]"
     * @throws Exception if tokenization lookup or symbol tokenizing fails
     */
    private static String buildAmbiguityClass() throws Exception {
        SymbolTokenization tokenizer = DNATools.getDNA().getTokenization("token");
        FiniteAlphabet matches = (FiniteAlphabet) DNATools.n().getMatches();
        Set symbols = AlphabetManager.getAllSymbols(matches);

        // Collect first, remove afterwards, so the set is not modified
        // while it is being iterated.
        List gaps = new ArrayList();
        Iterator it = symbols.iterator();
        while (it.hasNext()) {
            Symbol candidate = (Symbol) it.next();
            // Crude gap test: a symbol whose match alphabet is empty.
            int matchCount = ((FiniteAlphabet) candidate.getMatches()).size();
            if (matchCount == 0) {
                gaps.add(candidate);
            }
        }
        symbols.removeAll(gaps);

        // The symbols arrive as a Set, which has no defined order, so the
        // tokens are gathered into a char array and sorted to get a
        // reproducible string.
        Symbol[] remaining = (Symbol[]) symbols.toArray(new Symbol[symbols.size()]);
        char[] tokens = new char[remaining.length];
        for (int idx = 0; idx < tokens.length; idx++) {
            String token = tokenizer.tokenizeSymbol(remaining[idx]);
            tokens[idx] = token.charAt(0);
        }
        Arrays.sort(tokens);

        return "[" + String.valueOf(tokens) + "]";
    }

    /** A sequence without repeats is expected unchanged. */
    public void testPlain() {
        doTest("atcg", "atcg");
    }

    /** Two identical leading symbols are expected as a {2} quantifier. */
    public void testTwoStart() {
        doTest("aatcg", "a{2}tcg");
    }

    /** Three identical leading symbols are expected as a {3} quantifier. */
    public void testThreeStart() {
        doTest("aaatcg", "a{3}tcg");
    }

    /** Two identical internal symbols are expected as a {2} quantifier. */
    public void testTwoInternal() {
        doTest("attcg", "at{2}cg");
    }

    /** Three identical internal symbols are expected as a {3} quantifier. */
    public void testThreeInternal() {
        doTest("atttcg", "at{3}cg");
    }

    /** Two identical trailing symbols are expected as a {2} quantifier. */
    public void testTwoEnd() {
        doTest("atcgg", "atcg{2}");
    }

    /** Three identical trailing symbols are expected as a {3} quantifier. */
    public void testThreeEnd() {
        doTest("atcggg", "atcg{3}");
    }

    /** A sequence of just two identical symbols. */
    public void testTwoOnly() {
        doTest("aa", "a{2}");
    }

    /** A sequence of just three identical symbols. */
    public void testThreeOnly() {
        doTest("aaa", "a{3}");
    }

    /** A leading 'n' is expected as the bracketed character class. */
    public void testAmbStart() {
        doTest("ngct", n + "gct");
    }

    /** An internal 'n' is expected as the bracketed character class. */
    public void testAmbMiddle() {
        doTest("anct", "a" + n + "ct");
    }

    /** A trailing 'n' is expected as the bracketed character class. */
    public void testAmbEnd() {
        doTest("agcn", "agc" + n);
    }

    /** Two consecutive 'n' symbols: the character class with a {2} quantifier. */
    public void testTwoAmbOnly() {
        doTest("nn", n + "{2}");
    }

    /**
     * Parses {@code pattern} as DNA, converts it with
     * {@code MotifTools.createRegex} and asserts the result equals
     * {@code target}.
     *
     * @param pattern DNA sequence text handed to {@code DNATools.createDNA}
     * @param target  regex string the conversion is expected to produce
     */
    void doTest(String pattern, String target) {
        String regex;
        try {
            regex = MotifTools.createRegex(DNATools.createDNA(pattern));
        } catch (IllegalSymbolException ise) {
            throw new AssertionFailure(ise);
        }
        assertEquals(target, regex);
    }
}