Bio::SeqIO::strider: move into its own distribution
[bioperl-live.git] / lib / Bio / Range.pm
blob6dc61c0d58d4f92bd30dc566e97632d5b100fac9
2 # BioPerl module for Bio::Range
4 # Please direct questions and support issues to <bioperl-l@bioperl.org>
6 # Cared for by Heikki Lehvaslaiho <heikki-at-bioperl-dot-org>
8 # Copywright Matthew Pocock
10 # You may distribute this module under the same terms as perl itself
12 # POD documentation - main docs before the code
15 =head1 NAME
17 Bio::Range - Pure perl RangeI implementation
19 =head1 SYNOPSIS
21 $range = Bio::Range->new(-start=>10, -end=>30, -strand=>+1);
22 $r2 = Bio::Range->new(-start=>15, -end=>200, -strand=>+1);
24 print join(', ', $range->union($r2)), "\n";
25 print join(', ', $range->intersection($r2)), "\n";
27 print $range->overlaps($r2), "\n";
28 print $range->contains($r2), "\n";
30 =head1 DESCRIPTION
32 This provides a pure perl implementation of the BioPerl range
33 interface.
35 Ranges are modeled as having (start, end, length, strand). They use
36 Bio-coordinates - all points E<gt>= start and E<lt>= end are within the
37 range. End is always greater-than or equal-to start, and length is
38 greather than or equal to 1. The behaviour of a range is undefined if
39 ranges with negative numbers or zero are used.
41 So, in summary:
43 length = end - start + 1
44 end >= start
45 strand = (-1 | 0 | +1)
47 =head1 FEEDBACK
49 =head2 Mailing Lists
51 User feedback is an integral part of the evolution of this and other
52 Bioperl modules. Send your comments and suggestions preferably to one
53 of the Bioperl mailing lists. Your participation is much appreciated.
55 bioperl-l@bioperl.org - General discussion
56 http://bioperl.org/wiki/Mailing_lists - About the mailing lists
58 =head2 Support
60 Please direct usage questions or support issues to the mailing list:
62 I<bioperl-l@bioperl.org>
64 rather than to the module maintainer directly. Many experienced and
65 reponsive experts will be able look at the problem and quickly
66 address it. Please include a thorough description of the problem
67 with code and data examples if at all possible.
69 =head2 Reporting Bugs
71 Report bugs to the Bioperl bug tracking system to help us keep track
72 the bugs and their resolution. Bug reports can be submitted via the web:
74 https://github.com/bioperl/bioperl-live/issues
76 =head1 AUTHOR - Heikki Lehvaslaiho
78 Email heikki-at-bioperl-dot-org
80 =head1 APPENDIX
82 The rest of the documentation details each of the object
83 methods. Internal methods are usually preceded with a _
85 =cut
87 package Bio::Range;
89 use strict;
90 use Carp;
91 use integer;
94 use base qw(Bio::Root::Root Bio::RangeI);
96 =head1 Constructors
98 =head2 new
100 Title : new
101 Usage : $range = Bio::Range->new(-start => 100, -end=> 200, -strand = +1);
102 Function: generates a new Bio::Range
103 Returns : a new range
104 Args : -strand (defaults to 0) and any two of (-start, -end, -length),
105 the third will be calculated
107 =cut
109 sub new {
110 my ($caller, @args) = @_;
111 my $self = $caller->SUPER::new(@args);
112 my ($strand, $start, $end, $length) =
113 $self->_rearrange([qw(STRAND
114 START
115 END
116 LENGTH
117 )],@args);
118 $self->strand($strand || 0);
120 if(defined $start ) {
121 $self->start($start);
122 if(defined $end) {
123 $self->end($end);
124 } elsif(defined $length) {
125 $self->end($self->start()+ $length - 1);
127 } elsif(defined $end && defined $length ) {
128 $self->end($end);
129 $self->start($self->end() - $length + 1);
131 return $self;
134 =head2 unions
136 Title : unions
137 Usage : @unions = Bio::Range->unions(@ranges);
138 Function: generate a list of non-intersecting Bio::Range objects
139 from a list of Bio::Range objects which may intersect
140 Returns : a list of Bio::Range objects
141 Args : a list of Bio::Range objects
144 =cut
146 sub unions {
147 my ($class,@i) = @_;
149 my $i = 0;
150 my %i = map { $i++ => $_ } @i;
152 my $lastsize = scalar(keys %i);
154 do {
156 foreach my $j (sort { $i{$a}->start <=> $i{$b}->start } keys %i){
157 foreach my $k (sort { $i{$a}->start <=> $i{$b}->start } keys %i){
159 #it may have been replaced by a union under the key of
160 #the overlapping range, we are altering the hash in-place
161 next unless $i{$j};
163 next if $i{$k}->end < $i{$j}->start;
164 last if $i{$k}->start > $i{$j}->end;
166 if($i{$j}->overlaps($i{$k})){
167 my($start,$end,$strand) = $i{$j}->union($i{$k});
168 delete($i{$k});
169 $i{$j} = Bio::Range->new( -start => $start , -end => $end , -strand => $strand );
174 goto DONE if scalar(keys %i) == $lastsize;
175 $lastsize = scalar(keys %i);
177 #warn $lastsize;
179 } while(1);
181 DONE:
183 return values %i;
187 =head1 Member variable access
189 These methods let you get at and set the member variables
191 =head2 start
193 Title : start
194 Function : return or set the start co-ordinate
195 Example : $s = $range->start(); $range->start(7);
196 Returns : the value of the start co-ordinate
197 Args : optionally, the new start co-ordinate
198 Overrides: Bio::RangeI::start
200 =cut
202 sub start {
203 my ($self,$value) = @_;
204 if( defined $value) {
205 $self->throw("'$value' is not an integer.\n")
206 unless $value =~ /^[-+]?\d+$/;
207 $self->{'start'} = $value;
209 return $self->{'start'};
212 =head2 end
214 Title : end
215 Function : return or set the end co-ordinate
216 Example : $e = $range->end(); $range->end(2000);
217 Returns : the value of the end co-ordinate
218 Args : optionally, the new end co-ordinate
219 Overrides: Bio::RangeI::end
221 =cut
223 sub end {
225 my ($self,$value) = @_;
226 if( defined $value) {
227 $self->throw("'$value' is not an integer.\n")
228 unless $value =~ /^[-+]?\d+$/;
229 $self->{'end'} = $value;
231 return $self->{'end'};
234 =head2 strand
236 Title : strand
237 Function : return or set the strandedness
238 Example : $st = $range->strand(); $range->strand(-1);
239 Returns : the value of the strandedness (-1, 0 or 1)
240 Args : optionally, the new strand - (-1, 0, 1) or (-, ., +).
241 Overrides: Bio::RangeI::strand
243 =cut
247 my %VALID_STRAND = (
248 -1 => -1,
249 0 => 0,
250 1 => 1,
251 '+' => 1,
252 '-' => -1,
253 '.' => 0
256 sub strand {
257 my $self = shift;
258 if(@_) {
259 my $val = shift;
260 if (exists $VALID_STRAND{$val}) {
261 $self->{'strand'} = $VALID_STRAND{$val};
262 } else {
263 $self->throw("Invalid strand: $val");
266 return $self->{'strand'};
271 =head2 length
273 Title : length
274 Function : returns the length of this range
275 Example : $length = $range->length();
276 Returns : the length of this range, equal to end - start + 1
277 Args : if you attempt to set the length an exception will be thrown
278 Overrides: Bio::RangeI::Length
280 =cut
282 sub length {
283 my $self = shift;
284 if(@_) {
285 confess ref($self), "->length() is read-only";
287 return $self->end() - $self->start() + 1;
290 =head2 toString
292 Title : toString
293 Function: stringifies this range
294 Example : print $range->toString(), "\n";
295 Returns : a string representation of this range
297 =cut
299 sub toString {
300 my $self = shift;
301 return "(${\$self->start}, ${\$self->end}) strand=${\$self->strand}";
304 =head1 Boolean Methods
306 These methods return true or false.
308 $range->overlaps($otherRange) && print "Ranges overlap\n";
310 =head2 overlaps
312 Title : overlaps
313 Usage : if($r1->overlaps($r2)) { do stuff }
314 Function : tests if $r2 overlaps $r1
315 Args : a range to test for overlap with
316 Returns : true if the ranges overlap, false otherwise
317 Inherited: Bio::RangeI
319 =head2 contains
321 Title : contains
322 Usage : if($r1->contains($r2) { do stuff }
323 Function : tests whether $r1 totally contains $r2
324 Args : a range to test for being contained
325 Returns : true if the argument is totally contained within this range
326 Inherited: Bio::RangeI
328 =head2 equals
330 Title : equals
331 Usage : if($r1->equals($r2))
332 Function : test whether $r1 has the same start, end, length as $r2
333 Args : a range to test for equality
334 Returns : true if they are describing the same range
335 Inherited: Bio::RangeI
337 =head1 Geometrical methods
339 These methods do things to the geometry of ranges, and return
340 triplets (start, end, strand) from which new ranges could be built.
342 =head2 intersection
344 Title : intersection
345 Usage : ($start, $stop, $strand) = $r1->intersection($r2)
346 Function : gives the range that is contained by both ranges
347 Args : a range to compare this one to
348 Returns : nothing if they do not overlap, or the range that they do overlap
349 Inherited: Bio::RangeI::intersection
351 =cut
353 =head2 union
355 Title : union
356 Usage : ($start, $stop, $strand) = $r1->union($r2);
357 : ($start, $stop, $strand) = Bio::Range->union(@ranges);
358 Function : finds the minimal range that contains all of the ranges
359 Args : a range or list of ranges
360 Returns : the range containing all of the ranges
361 Inherited: Bio::RangeI::union
363 =cut