2 # BioPerl module for Bio::Search::HSP::FastaHSP
4 # Please direct questions and support issues to <bioperl-l@bioperl.org>
6 # Cared for by Jason Stajich <jason@bioperl.org>
8 # Copyright Jason Stajich
10 # You may distribute this module under the same terms as perl itself
12 # POD documentation - main docs before the code
16 Bio::Search::HSP::FastaHSP - HSP object for FASTA specific data
20 # get a FastaHSP from a SearchIO stream
21 my $in = Bio::SearchIO->new(-format => 'fasta', -file => 'filename.fasta');
23 while( my $r = $in->next_result) {
24 while( my $hit = $r->next_result ) {
25 while( my $hsp = $hit->next_hsp ) {
26 print "smith-waterman score (if available): ",
27 $hsp->sw_score(),"\n";
34 Describe the object here
40 User feedback is an integral part of the evolution of this and other
41 Bioperl modules. Send your comments and suggestions preferably to
42 the Bioperl mailing list. Your participation is much appreciated.
44 bioperl-l@bioperl.org - General discussion
45 http://bioperl.org/wiki/Mailing_lists - About the mailing lists
49 Please direct usage questions or support issues to the mailing list:
51 I<bioperl-l@bioperl.org>
53 rather than to the module maintainer directly. Many experienced and
54 reponsive experts will be able look at the problem and quickly
55 address it. Please include a thorough description of the problem
56 with code and data examples if at all possible.
60 Report bugs to the Bioperl bug tracking system to help us keep track
61 of the bugs and their resolution. Bug reports can be submitted via the
64 https://github.com/bioperl/bioperl-live/issues
66 =head1 AUTHOR - Jason Stajich
68 Email jason-at-bioperl.org
72 The rest of the documentation details each of the object methods.
73 Internal methods are usually preceded with a _
78 # Let the code begin...
81 package Bio
::Search
::HSP
::FastaHSP
;
85 use base
qw(Bio::Search::HSP::GenericHSP);
90 Usage : my $obj = Bio::Search::HSP::FastaHSP->new();
91 Function: Builds a new Bio::Search::HSP::FastaHSP object
92 Returns : Bio::Search::HSP::FastaHSP
93 Args : -swscore => smith-waterman score
98 my($class,@args) = @_;
100 my $self = $class->SUPER::new
(@args);
102 my ($swscore, $evalue2) = $self->_rearrange([qw(SWSCORE EVALUE2)], @args);
104 defined $swscore && $self->sw_score($swscore);
106 defined $evalue2 && $self->evalue2($evalue2);
115 Usage : $obj->sw_score($newval)
116 Function: Get/Set Smith-Waterman score
117 Returns : value of sw_score
118 Args : newvalue (optional)
124 my ($self,$value) = @_;
125 if( defined $value || ! defined $self->{'_sw_score'} ) {
126 $value = 0 unless defined $value; # default value
127 $self->{'_sw_score'} = $value;
129 return $self->{'_sw_score'};
135 Usage : $obj->evalue2($newval)
136 Function: Get/Set E2() expectation value
137 Returns : value of evalue2
138 Args : newvalue (optional)
144 my ($self,$value) = @_;
145 if( defined $value || ! defined $self->{'_evalue2'} ) {
146 $value = 0 unless defined $value; # default value
147 $self->{'_evalue2'} = $value;
149 return $self->{'_evalue2'};
155 require Bio
::LocatableSeq
;
156 require Bio
::SimpleAlign
;
157 my $aln = Bio
::SimpleAlign
->new();
158 my $hs = $self->hit_string();
159 my $qs = $self->query_string();
161 # fasta reports some extra 'regional' sequence information
162 # we need to clear out first
163 # this seemed a bit insane to me at first, but it appears to
166 # modified to deal with LocatableSeq's end point verification and to deal
167 # with frameshifts (which shift the end points in translated sequences).
169 # we infer the end of the regional sequence where the first
170 # non space is in the homology string
171 # then we use the HSP->length to tell us how far to read
172 # to cut off the end of the sequence
174 my ($start, $rest) = (0, 0);
175 if( $self->homology_string() =~ /^(\s+)?(.*?)\s*$/ ) {
176 ($start, $rest) = ($1 ? CORE
::length($1) : 0, CORE
::length($2));
178 $self->debug("hs seq is '$hs'\n");
179 $self->debug("qs seq is '$qs'\n");
181 $hs = substr($hs, $start,$rest);
182 $qs = substr($qs, $start,$rest);
185 $seqonly =~ s/\s+//g;
186 my ($q_nm,$s_nm) = ($self->query->seq_id(),
187 $self->hit->seq_id());
188 unless( defined $q_nm && CORE
::length ($q_nm) ) {
191 unless( defined $s_nm && CORE
::length ($s_nm) ) {
194 $self->_calculate_seq_positions;
195 my $query = Bio
::LocatableSeq
->new('-seq' => $seqonly,
197 '-start' => $self->query->start,
198 '-end' => $self->query->end,
199 '-frameshifts' => (exists $self->{seqinds
}{_frameshiftRes_query
}) ?
200 $self->{seqinds
}{_frameshiftRes_query
} : undef,
201 '-mapping' => [1, $self->{_query_mapping
}],
202 -verbose
=> $self->verbose
205 $seqonly =~ s/\s+//g;
206 my $hit = Bio
::LocatableSeq
->new('-seq' => $seqonly,
208 '-start' => $self->hit->start,
209 '-end' => $self->hit->end,
210 '-frameshifts' => exists $self->{seqinds
}{_frameshiftRes_sbjct
} ?
211 $self->{seqinds
}{_frameshiftRes_sbjct
} : undef,
212 '-mapping' => [1, $self->{_hit_mapping
}],
213 -verbose
=> $self->verbose
215 $aln->add_seq($query);