1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256
|
#---------------------------------------------------------
#ISA ProtMatrix, HAS InstanceSite
=head1 NAME
Bio::Matrix::PSM::ProtPsm - handle combination of site matricies
=head1 SYNOPSIS
use Bio::Matrix::PSM::IO;
#To get a ProtPsm object from a file use the Psm parser:
my $psmIO = Bio::Matrix::PSM::IO->new(-format=>'psiblast', -file=>$file);
# Now go through all entities in the file with next_psm, which
# returns a Psm object see Bio::Matrix::PSM::IO for detailed
# documentation (matrix predictions or matrix sequence matches or
# both):
while (my $psm=$psmIO->next_psm) {
my %psm_header = $psm->header;
my $ic = $psm_header{IC};
my $sites = $psm_header{sites};
my $width = $psm_header{width};
my $score = $psm_header{e_val};
my $IUPAC = $psm->IUPAC;
my $instances = $psm->instances;
foreach my $instance (@{$instances}) {
my $id = $instance->primary_id;
#Do something with the id
}
}
=head1 DESCRIPTION
To handle a combination of site matrices and/or their corresponding sequence
matches (instances). This object inherits from Bio::Matrix::PSM::ProtMatrix, so
you can methods from that class. It may hold also an array of
Bio::Matrix::PSM::InstanceSite object, but you will have to retrieve these
through Bio::Matrix::PSM::ProtPsm-E<gt>instances method (see below). To some
extent this is an expanded ProtMatrix object, holding data from analysis that
also deal with sequence matches of a particular matrix.
=head2 DESIGN ISSUES
This does not make too much sense to me I am mixing PSM with PSM sequence
matches Though they are very closely related, I am not satisfied by the way
this is implemented here. Heikki suggested different objects when one has
something like meme But does this mean we have to write a different objects for
mast, meme, transfac, theiresias, etc.? To me the best way is to return
SiteMatrix object + arrray of InstanceSite objects and then mast will return
undef for SiteMatrix and transfac will return undef for InstanceSite. Probably
I cannot see some other design issues that might arise from such approach, but
it seems more straightforward. Hilmar does not like this because it is an
exception from the general BioPerl rules. Should I leave this as an option?
Also the header rightfully belongs the driver object, and could be retrieved as
hashes. I do not think it can be done any other way, unless we want to create
even one more object with very unclear content.
=head1 FEEDBACK
=head2 Mailing Lists
User feedback is an integral part of the evolution of this
and other Bioperl modules. Send your comments and suggestions preferably
to one of the Bioperl mailing lists.
Your participation is much appreciated.
bioperl-l@bioperl.org - General discussion
http://bioperl.org/wiki/Mailing_lists - About the mailing lists
=head2 Support
Please direct usage questions or support issues to the mailing list:
I<bioperl-l@bioperl.org>
rather than to the module maintainer directly. Many experienced and
reponsive experts will be able look at the problem and quickly
address it. Please include a thorough description of the problem
with code and data examples if at all possible.
=head2 Reporting Bugs
Report bugs to the Bioperl bug tracking system to help us keep track
the bugs and their resolution. Bug reports can be submitted via the
web:
https://github.com/bioperl/bioperl-live/issues
=head1 AUTHOR - James Thompson
Email tex@biosysadmin.com
=head1 DISCLAIMER
This software is provided "as is" without warranty of any kind.
=head1 SEE ALSO
ProtMatrix, meme, transfac, psiblast, InstanceSite
=head1 APPENDIX
=cut
# Let the code begin...
package Bio::Matrix::PSM::ProtPsm;
$Bio::Matrix::PSM::ProtPsm::VERSION = '1.7.8';
use Bio::Matrix::PSM::InstanceSite;
use strict;
use base qw(Bio::Matrix::PSM::ProtMatrix Bio::Matrix::PSM::PsmI Bio::Annotation::Collection);
@Bio::Matrix::PSM::Psm::HEADER = qw(e_val sites IC width);
=head2 new
Title : new
Usage : my $psm = Bio::Matrix::PSM::ProtPsm->new(
-pS => [ '0', '33', '0', '16', '1', '12', '11', '25' ],
-pF => [ '0', '0', '2', '0', '3', '0', '0', '0' ],
-pT => [ '0', '8', '7', '10', '1', '2', '7', '8' ],
-pN => [ '0', '0', '2', '13', '0', '36', '1', '4' ],
-pK => [ '0', '5', '0', '13', '1', '15', '0', '2' ],
-pY => [ '0', '0', '0', '0', '0', '0', '0', '0' ],
-pE => [ '0', '41', '1', '12', '0', '0', '0', '15' ],
-pV => [ '0', '3', '9', '0', '2', '0', '3', '1' ],
-pQ => [ '0', '0', '0', '15', '0', '4', '0', '3' ],
-pM => [ '100', '0', '66', '0', '2', '0', '0', '0' ],
-pC => [ '0', '0', '0', '0', '0', '0', '0', '0' ],
-pL => [ '0', '0', '8', '0', '25', '0', '4', '0' ],
-pA => [ '0', '10', '1', '9', '2', '0', '22', '16' ],
-pW => [ '0', '0', '0', '0', '0', '0', '0', '0' ],
-pP => [ '0', '0', '0', '0', '3', '1', '45', '0' ],
-pH => [ '0', '0', '0', '0', '0', '0', '1', '0' ],
-pD => [ '0', '0', '1', '7', '2', '2', '0', '22' ],
-pR => [ '0', '0', '0', '3', '0', '27', '0', '0' ],
-pI => [ '0', '0', '3', '0', '59', '1', '2', '3' ],
-pG => [ '0', '0', '0', '1', '0', '0', '4', '1' ],
-IC => $ic,
-sites => $istes,
-width => $width,
-e_val => $e_val,
-instances => $instances,
}
Function: Creates a new Bio::Matrix::PSM::ProtPsm object
Throws :
Example :
Returns : Bio::Matrix::PSM::Psm object
Args : hash
=cut
sub new {
my ($caller,@args) = @_;
my $class = ref($caller) || $caller;
my $self = $class->SUPER::new(@args);
$self->{'_annotation'} = {}; #Init from Annotation::Collection
$self->_typemap(Bio::Annotation::TypeManager->new()); #same
($self->{instances})=$self->_rearrange(['INSTANCES'], @args);
return $self;
}
=head2 instances
Title : instances
Usage : my @instances=@{$psm->instances};
Function: Gets/sets the instances (Bio::Matrix::PSM::InstanceSite objects)
associated with the Psm object
Throws :
Example :
Returns : array reference (Bio::Matrix::PSM::InstanceSite objects)
Args : array reference (Bio::Matrix::PSM::InstanceSite objects)
=cut
sub instances {
my $self = shift;
my $prev = $self->{instances};
if (@_) { $self->{instances} = shift; }
return $prev;
}
=head2 header
Title : header
Usage : my %header=$psm->header;
my $ic=$psm->header('IC');
Function: Gets the general information, common for most files,
dealing with PSM such as information content (IC), score
(e-value, etc.), number of sites (sites) and width. This
list may expand. The current list should be in
@Bio::Matrix::PSM::Psm::HEADER. Returns an epty list if an
argument is supplied that is not in
@Bio::Matrix::PSM::meme::HEADER.
Throws :
Example :
Returns : hash or string
Args : string (IC, e_val...)
=cut
sub header {
my $self = shift;
return if ($self->{end});
my %header;
if (@_) {my $key=shift; return $self->{$key}; }
foreach my $key (@Bio::Matrix::PSM::ProtPsm::HEADER) {
$header{$key}=$self->{$key};
}
return %header;
}
=head2 matrix
Title : matrix
Usage : my $matrix = $psm->matrix;
Function: Gets/sets the SiteMatrix related information
Throws :
Example :
Returns : Bio::Matrix::PSM::SiteMatrix objects
Args : Bio::Matrix::PSM::SiteMatrix objects
=cut
sub matrix {
my $self = shift;
if (@_) {
my $matrix = shift;
my @alphabet = $self->alphabet;
foreach my $char (@alphabet) {
$self->{"log$char"} = $matrix->{"log$char"};
$self->{"prob$char"} = $matrix->{"prob$char"};
}
$self->{IC} = $matrix->IC;
$self->{e_val} = $matrix->e_val;
$self->{id} = $matrix->id;
}
return $self;
}
1;
|