Raw content of Bio::SeqFeature::PositionProxy
# $Id: PositionProxy.pm,v 1.4 2002/10/22 07:38:41 lapp Exp $
#
# BioPerl module for Bio::SeqFeature::PositionProxy
#
# Cared for by Ewan Birney
#
# Copyright Ewan Birney
#
# You may distribute this module under the same terms as perl itself
# POD documentation - main docs before the code
=head1 NAME
Bio::SeqFeature::PositionProxy - handle features when truncation/revcom sequences span a feature
=head1 SYNOPSIS
$proxy = new Bio::SeqFeature::PositionProxy ( -loc => $loc,
-parent => $basefeature);
$seq->add_SeqFeature($feat);
=head1 DESCRIPTION
PositionProxy is a Proxy Sequence Feature to handle truncation
and revcomp without duplicating all the data within the sequence features.
It holds a new location for a sequence feature and the original feature
it came from to provide the additional annotation information.
=head1 FEEDBACK
=head2 Mailing Lists
User feedback is an integral part of the evolution of this and other
Bioperl modules. Send your comments and suggestions preferably to one
of the Bioperl mailing lists. Your participation is much appreciated.
bioperl-l@bioperl.org - General discussion
http://bio.perl.org/MailList.html - About the mailing lists
=head2 Reporting Bugs
Report bugs to the Bioperl bug tracking system to help us keep track
the bugs and their resolution. Bug reports can be submitted via email
or the web:
bioperl-bugs@bio.perl.org
http://bugzilla.bioperl.org/
=head1 AUTHOR - Ewan Birney
Ewan Birney Ebirney@sanger.ac.ukE
=head1 DEVELOPERS
This class has been written with an eye out of inheritence. The fields
the actual object hash are:
_gsf_tag_hash = reference to a hash for the tags
_gsf_sub_array = reference to an array for sub arrays
_gsf_start = scalar of the start point
_gsf_end = scalar of the end point
_gsf_strand = scalar of the strand
=head1 APPENDIX
The rest of the documentation details each of the object
methods. Internal methods are usually preceded with a _
=cut
# Let the code begin...
package Bio::SeqFeature::PositionProxy;
use vars qw(@ISA);
use strict;
use Bio::Root::Root;
use Bio::SeqFeatureI;
use Bio::Tools::GFF;
@ISA = qw(Bio::Root::Root Bio::SeqFeatureI);
sub new {
my ($caller, @args) = @_;
my $self = $caller->SUPER::new(@args);
my ($feature,$location) = $self->_rearrange([qw(PARENT LOC)],@args);
if( !defined $feature || !ref $feature || !$feature->isa('Bio::SeqFeatureI') ) {
$self->throw("Must have a parent feature, not a [$feature]");
}
if( $feature->isa("Bio::SeqFeature::PositionProxy") ) {
$feature = $feature->parent();
}
if( !defined $location || !ref $location || !$location->isa('Bio::LocationI') ) {
$self->throw("Must have a location, not a [$location]");
}
return $self;
}
=head2 location
Title : location
Usage : my $location = $seqfeature->location()
Function: returns a location object suitable for identifying location
of feature on sequence or parent feature
Returns : Bio::LocationI object
Args : none
=cut
sub location {
my($self, $value ) = @_;
if (defined($value)) {
unless (ref($value) and $value->isa('Bio::LocationI')) {
$self->throw("object $value pretends to be a location but ".
"does not implement Bio::LocationI");
}
$self->{'_location'} = $value;
}
elsif (! $self->{'_location'}) {
# guarantees a real location object is returned every time
$self->{'_location'} = Bio::Location::Simple->new();
}
return $self->{'_location'};
}
=head2 parent
Title : parent
Usage : my $sf = $proxy->parent()
Function: returns the seqfeature parent of this proxy
Returns : Bio::SeqFeatureI object
Args : none
=cut
sub parent {
my($self, $value ) = @_;
if (defined($value)) {
unless (ref($value) and $value->isa('Bio::SeqFeatureI')) {
$self->throw("object $value pretends to be a location but ".
"does not implement Bio::SeqFeatureI");
}
$self->{'_parent'} = $value;
}
return $self->{'_parent'};
}
=head2 start
Title : start
Usage : $start = $feat->start
$feat->start(20)
Function: Get
Returns : integer
Args : none
=cut
sub start {
my ($self,$value) = @_;
return $self->location->start($value);
}
=head2 end
Title : end
Usage : $end = $feat->end
$feat->end($end)
Function: get
Returns : integer
Args : none
=cut
sub end {
my ($self,$value) = @_;
return $self->location->end($value);
}
=head2 length
Title : length
Usage :
Function:
Example :
Returns :
Args :
=cut
sub length {
my ($self) = @_;
return $self->end - $self->start() + 1;
}
=head2 strand
Title : strand
Usage : $strand = $feat->strand()
$feat->strand($strand)
Function: get/set on strand information, being 1,-1 or 0
Returns : -1,1 or 0
Args : none
=cut
sub strand {
my ($self,$value) = @_;
return $self->location->strand($value);
}
=head2 attach_seq
Title : attach_seq
Usage : $sf->attach_seq($seq)
Function: Attaches a Bio::Seq object to this feature. This
Bio::Seq object is for the *entire* sequence: ie
from 1 to 10000
Example :
Returns : TRUE on success
Args :
=cut
sub attach_seq {
my ($self, $seq) = @_;
if ( !defined $seq || !ref $seq || ! $seq->isa("Bio::PrimarySeqI") ) {
$self->throw("Must attach Bio::PrimarySeqI objects to SeqFeatures");
}
$self->{'_gsf_seq'} = $seq;
# attach to sub features if they want it
foreach my $sf ( $self->sub_SeqFeature() ) {
if ( $sf->can("attach_seq") ) {
$sf->attach_seq($seq);
}
}
return 1;
}
=head2 seq
Title : seq
Usage : $tseq = $sf->seq()
Function: returns the truncated sequence (if there) for this
Example :
Returns : sub seq on attached sequence bounded by start & end
Args : none
=cut
sub seq {
my ($self, $arg) = @_;
if ( defined $arg ) {
$self->throw("Calling SeqFeature::PositionProxy->seq with an argument. You probably want attach_seq");
}
if ( ! exists $self->{'_gsf_seq'} ) {
return undef;
}
# assumming our seq object is sensible, it should not have to yank
# the entire sequence out here.
my $seq = $self->{'_gsf_seq'}->trunc($self->start(), $self->end());
if ( $self->strand == -1 ) {
$seq = $seq->revcom;
}
return $seq;
}
=head2 entire_seq
Title : entire_seq
Usage : $whole_seq = $sf->entire_seq()
Function: gives the entire sequence that this seqfeature is attached to
Example :
Returns :
Args :
=cut
sub entire_seq {
my ($self) = @_;
return undef unless exists($self->{'_gsf_seq'});
return $self->{'_gsf_seq'};
}
=head2 seqname
Title : seqname
Usage : $obj->seq_id($newval)
Function: There are many cases when you make a feature that you
do know the sequence name, but do not know its actual
sequence. This is an attribute such that you can store
the seqname.
This attribute should *not* be used in GFF dumping, as
that should come from the collection in which the seq
feature was found.
Returns : value of seqname
Args : newvalue (optional)
=cut
sub seqname {
my ($obj,$value) = @_;
if ( defined $value ) {
$obj->{'_gsf_seqname'} = $value;
}
return $obj->{'_gsf_seqname'};
}
=head2 Proxies
These functions chain back to the parent for all non sequence related stuff.
=cut
=head2 primary_tag
Title : primary_tag
Usage : $tag = $feat->primary_tag()
Function: Returns the primary tag for a feature,
eg 'exon'
Returns : a string
Args : none
=cut
sub primary_tag{
my ($self,@args) = @_;
return $self->parent->primary_tag();
}
=head2 source_tag
Title : source_tag
Usage : $tag = $feat->source_tag()
Function: Returns the source tag for a feature,
eg, 'genscan'
Returns : a string
Args : none
=cut
sub source_tag{
my ($self) = @_;
return $self->parent->source_tag();
}
=head2 has_tag
Title : has_tag
Usage : $tag_exists = $self->has_tag('some_tag')
Function:
Returns : TRUE if the specified tag exists, and FALSE otherwise
Args :
=cut
sub has_tag{
my ($self,$tag) = @_;
return $self->parent->has_tag($tag);
}
=head2 each_tag_value
Title : each_tag_value
Usage : @values = $self->each_tag_value('some_tag')
Function:
Returns : An array comprising the values of the specified tag.
Args :
=cut
sub each_tag_value {
my ($self,$tag) = @_;
return $self->parent->each_tag_value($tag);
}
=head2 all_tags
Title : all_tags
Usage : @tags = $feat->all_tags()
Function: gives all tags for this feature
Returns : an array of strings
Args : none
=cut
sub all_tags{
my ($self) = @_;
return $self->parent->all_tags();
}