File: GuessSeqFormat.t

package info (click to toggle)
bioperl 1.7.8-1
  • links: PTS, VCS
  • area: main
  • in suites: bookworm, sid, trixie
  • size: 35,788 kB
  • sloc: perl: 94,019; xml: 14,811; makefile: 20
file content (144 lines) | stat: -rw-r--r-- 3,392 bytes parent folder | download | duplicates (2)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
# -*-Perl-*- Test Harness script for Bioperl
# $Id$

use strict;

BEGIN {
    use Bio::Root::Test;
   
    test_begin(-tests => 105);
   
    use_ok 'Bio::Tools::GuessSeqFormat';
    use_ok 'Bio::SeqIO';
    use_ok 'Bio::AlignIO';
}


ok my $guesser = Bio::Tools::GuessSeqFormat->new;
isa_ok $guesser, 'Bio::Tools::GuessSeqFormat';


#
# Test guesser interfaces
#

# 1/ File guess
ok $guesser = Bio::Tools::GuessSeqFormat->new(
    -file => test_input_file('test.fasta'),
), 'File input';
is $guesser->guess, 'fasta';

# 2/ String guess
my $string = ">test1 no comment
agtgctagctagctagctagct
>test2 no comment
gtagttatgc
";
ok $guesser = Bio::Tools::GuessSeqFormat->new(
    -text => $string,
), 'String input';
is $guesser->guess, 'fasta';

# 3/ Filehandle guess
SKIP: {
    test_skip(-tests => 2, -requires_modules => [qw(IO::String)]);
    require IO::String;
    my $fh = IO::String->new($string);
    ok $guesser = Bio::Tools::GuessSeqFormat->new(
        -fh => $fh,
    ), 'Filehandle input';
    is $guesser->guess, 'fasta';
}


#
# Test behavior with unknown format
#

is $guesser = Bio::Tools::GuessSeqFormat->new(
    -file => test_input_file('test.waba'), # Bio::SearchIO::waba
)->guess, undef, 'Unknown file format';

throws_ok {
    Bio::SeqIO->new( -file=>test_input_file('test.waba') );
} qr/Could not guess format/;


#
# Test SeqIO formats
#

my @fmts = qw{ace embl fasta fastq game gcg genbank pir raw swiss tab};

for my $fmt (@fmts) {
    SKIP: {
        test_skip(
            -tests => 4,
            -requires_modules => [qw(XML::Writer XML::Parser::PerlSAX)]
        ) if $fmt eq 'game';
        test_skip(
            -tests => 4,
            -requires_module  => 'Data::Stag'
        ) if $fmt eq 'swiss';

        my $guess = Bio::Tools::GuessSeqFormat->new(
            -file => test_input_file("test.$fmt"),
        )->guess;
        is $guess, $fmt, "$fmt format";

        ok my $input = Bio::SeqIO->new( -file=>test_input_file("test.$fmt") );
        ok my $seq = $input->next_seq();
        isa_ok $seq, 'Bio::PrimarySeqI';
    }
}


#
# Test AlignIO formats
#

@fmts = qw{clustalw fasta fastq mase mega msf nexus pfam phylip prodom selex};

## Instead of this, we should instead have a mock of those modules.
## Two reasons: 1) this modules are dependent on ourselves so this
## tests will only be triggered when updating. 2) it's not really our
## job to check if the other module reads file correctly, we just need
## to ensure that it's called to read the file.
SKIP: {
    test_skip(-tests => 4,
              -requires_modules => ['Bio::AlignIO::stockholm']);
    push(@fmts, 'stockholm');
}


my %skip_module = map {$_=>1} qw{ fastq };

for my $fmt (@fmts) {
    my $guess = Bio::Tools::GuessSeqFormat->new(
        -file => test_input_file("testaln.$fmt")
    )->guess;
    is $guess, $fmt, "$fmt format";
    next if $skip_module{$fmt};

    ok my $input = Bio::AlignIO->new( -file=>test_input_file("testaln.$fmt") );
    ok my $seq = $input->next_aln();
    isa_ok $seq, 'Bio::Align::AlignI';
}


#
# Other formats
#

my %fmts = (
   blast    => test_input_file('blastp2215.blast'),
   gcgblast => test_input_file('test.gcgblast'),
   vcf      => test_input_file('example.vcf'),
);

while (my ($fmt, $file) = each %fmts) {
    my $guess = Bio::Tools::GuessSeqFormat->new(
        -file => $file,
    )->guess;
    is $guess, $fmt, "$fmt format";
}