HavanaAdder documentation.

Bio::EnsEMBL::Analysis::RunnableDB::HavanaAdder

No package variables defined.

Bio::EnsEMBL::Analysis::Config::GeneBuild::General qw ( GB_INPUTID_REGEX )

Bio::EnsEMBL::Analysis::Config::HavanaAdder qw ( GB_ENSEMBL_INPUT_GENETYPE HAVANA_GENE_OUTPUT_BIOTYPE MERGED_GENE_OUTPUT_BIOTYPE ENSEMBL_GENE_OUTPUT_BIOTYPE MERGED_TRANSCRIPT_OUTPUT_TYPE )

Bio::EnsEMBL::Analysis::Runnable::HavanaAdder

Bio::EnsEMBL::Analysis::RunnableDB

Bio::EnsEMBL::Analysis::RunnableDB::BaseGeneBuild

Bio::EnsEMBL::Utils::Exception qw ( throw warning )

    my $obj = Bio::EnsEMBL::Analysis::RunnableDB::HavanaAdder->new(
								    -db        => $db,
								    -input_id  => $id,
								    );
    $obj->fetch_input;
    $obj->run;

    my @newfeatures = $obj->output;

# Register a genebuilder object for the piece of genomic it will run on.
#
# Arg 1 : the genebuilder object to store
# Arg 2 : the object it runs on; the value of its id() method is the key
#         under which the genebuilder is kept in $self->{_genebuilder}
# Throws (via $self->throw) when either argument is undefined.
sub addgenebuilder {
    my ($self, $arg, $contig) = @_;

    if (!defined $arg || !defined $contig) {
        $self->throw("Wrong number of inputs [$arg,$contig]\n");
    }
    else {
        $self->{_genebuilder}{ $contig->id } = $arg;
    }
}

############################################################

}

# Prepare everything needed to run on the region named by input_id.
#
# Looks up the DISCARDED_DB, PSEUDO_DB, HAVANA_DB and REFERENCE_DB adaptors,
# fetches the slice named by input_id from the reference database, stores it
# as the query, then creates a HavanaAdder runnable for that slice and
# registers it with addgenebuilder. Progress is printed to STDOUT.
#
# Throws if no input id is set or if the slice cannot be fetched.
sub fetch_input {

    my ($self) = @_;

    $self->throw("No input id") unless defined($self->input_id);

    # NOTE(review): the return value is discarded here and the slice that is
    # actually used is fetched from REFERENCE_DB below -- confirm whether this
    # call is still needed.
    $self->fetch_sequence();

    my $discarded_db = $self->get_dbadaptor("DISCARDED_DB");

    print "DISCARDED GENE DB: ", $discarded_db->dbname,"\n";

    # database where the genebuild produced genes are
    my $ensembl_db = $self->get_dbadaptor("PSEUDO_DB");

    print "ENSEMBL DB : ",  $ensembl_db->dbname,"\n";

    my $havana_db = $self->get_dbadaptor("HAVANA_DB");

    print "HAVANA DB : ",  $havana_db->dbname,"\n";

    my $ref_db = $self->get_dbadaptor("REFERENCE_DB");

    print $self->input_id,"\n";

    my $slice = $ref_db->get_SliceAdaptor->fetch_by_name($self->input_id);

    # Fail here with a clear message instead of passing undef on and failing
    # later with an unrelated-looking error.
    $self->throw("Unable to fetch slice '" . $self->input_id . "' from REFERENCE_DB")
      unless defined $slice;

    print $slice,"\n";

    $self->query($slice);

    print "QUERY: ",$self->query->seq_region_name,"\n";

    # Direct method-call syntax; the indirect "new Class (...)" form is
    # ambiguous to the parser.
    my $genebuilder = Bio::EnsEMBL::Analysis::Runnable::HavanaAdder->new(
       '-slice'    => $self->query,
       '-input_id' => $self->input_id,
    );
    $genebuilder->discarded_db($discarded_db);
    $genebuilder->ensembl_db($ensembl_db);
    $genebuilder->havana_db($havana_db);

    # store the object and the piece of genomic where it will run
    $self->addgenebuilder($genebuilder,$self->query);

}

############################################################

}

# Return the hash reference of registered genebuilders (as filled in by
# addgenebuilder), or undef when nothing has been registered yet.
sub get_genebuilders {
    my $self = shift;

    return $self->{_genebuilder};
}

############################################################

}

# Get or set the input id.
#
# Arg 1 (optional) : new input id; stored only when defined
# Returns the current input id (undef if none has been set).
sub input_id {
    my $self   = shift;
    my $new_id = shift;

    $self->{_input_id} = $new_id if defined $new_id;

    return $self->{_input_id};
}

############################################################

}

# Constructor: hands all arguments straight to the parent class constructor
# and returns the object it builds.
sub new {
    my $class = shift;

    my $self = $class->SUPER::new(@_);

    return $self;
}

############################################################

}

# Accumulating accessor for the result genes.
#
# Args (optional) : genes to append to the stored output list
# Returns the full list of stored genes (its element count in scalar context).
sub output {
    my $self = shift;

    $self->{_output} ||= [];
    push @{ $self->{_output} }, @_ if @_;

    return @{ $self->{_output} };
}

############################################################



1;

}

# Run every registered genebuilder and collect the genes they produce.
#
# For each genebuilder returned by get_genebuilders, calls build_Genes and
# then appends its final_genes to the result list, so that genes from all
# genebuilders are kept (assigning instead of appending would keep only the
# genes of whichever genebuilder happened to come last in hash order).
# The collected genes are handed to output().
#
# Returns whatever output() returns.
sub run {

    my ($self) = @_;

    # get a hash, with keys = contig/slice and value = genebuilder object
    my $genebuilders = $self->get_genebuilders;

    my @genes;
    foreach my $contig (keys %{ $genebuilders } ) {
      my $genebuilder = $genebuilders->{$contig};

      #print(STDERR "GeneBuilding for $contig\n");

      $genebuilder->build_Genes;

      push @genes, $genebuilder->final_genes;
    }

    return $self->output( @genes );
}

############################################################

# override the evil RunnableDB output method:

}

# Store the final genes of every registered genebuilder in GENEBUILD_DB.
#
# Genes passed as arguments are not used: the list is replaced by each
# genebuilder's final_genes. Every gene gets the current analysis attached
# and a biotype chosen from the biotypes of its transcripts:
#   - more than one transcript biotype, or exactly one that equals
#     $MERGED_TRANSCRIPT_OUTPUT_TYPE      -> $MERGED_GENE_OUTPUT_BIOTYPE
#   - exactly one, equal to
#     $GB_ENSEMBL_INPUT_GENETYPE          -> $ENSEMBL_GENE_OUTPUT_BIOTYPE
#   - anything else                       -> $HAVANA_GENE_OUTPUT_BIOTYPE
# A gene that fails to store is reported through warning() and the loop
# carries on with the next gene.
#
# Throws if no analysis is set. Returns 1.
sub write_output {

  my ($self, @genes) = @_;

  # write genes out to a different database from the one we read genewise genes from.
  my $db = $self->get_dbadaptor("GENEBUILD_DB");

  # sort out analysis
  my $analysis = $self->analysis;
  unless ($analysis) {
    $self->throw("an analysis logic name must be defined in the command line");
  }

  my $gene_adaptor = $db->get_GeneAdaptor;

  # this now assumes that we are building on a single VC.
  my $genebuilders = $self->get_genebuilders;

  foreach my $contig ( keys %$genebuilders ) {
    @genes = $genebuilders->{$contig}->final_genes;

    # Skip only this genebuilder when it produced nothing; returning here
    # would silently drop the genes of every remaining genebuilder.
    next unless @genes;

    foreach my $gene (@genes) {
      my %trans_types;
      $gene->analysis($analysis);
      #$gene->type($GB_GENE_OUTPUT_BIOTYPE);

      # poke the caches: the results are not used here, the calls are made
      # before the gene is stored
      foreach my $tran (@{ $gene->get_all_Transcripts }) {
        $trans_types{ $tran->biotype } = 1;
        #$tran->stable_id(undef);
        $tran->get_all_supporting_features;

        my @exons = @{ $tran->get_all_Exons };

        # Not every transcript has a translation; only reset the stable id
        # when there is one, rather than autovivifying a throwaway hash.
        my $tln = $tran->translation;
        $tln->{'stable_id'} = undef if $tln;

        foreach my $exon (@exons) {
          $exon->get_all_supporting_features;
          #$exon->{'stable_id'} = undef;
        }
      }

      my @total_biotypes = keys %trans_types;

      if (scalar(@total_biotypes) > 1 || (scalar(@total_biotypes) == 1 &&
             $total_biotypes[0] eq $MERGED_TRANSCRIPT_OUTPUT_TYPE)) {
        $gene->biotype($MERGED_GENE_OUTPUT_BIOTYPE);
      }
      elsif (scalar(@total_biotypes) == 1 &&
             $total_biotypes[0] eq $GB_ENSEMBL_INPUT_GENETYPE) {
        $gene->biotype($ENSEMBL_GENE_OUTPUT_BIOTYPE);
      }
      else {
        $gene->biotype($HAVANA_GENE_OUTPUT_BIOTYPE);
      }

      # store
      eval {
        $gene_adaptor->store($gene);
        #print STDERR "wrote gene " . $gene->dbID . " to database ".
        #   $gene->adaptor->db->dbname."\n";
      };
      if ( $@ ) {
        warning("UNABLE TO WRITE GENE:\n$@");
      }
    }
  }
  return 1;
}

############################################################

}

General documentation

Describe contact details here

The rest of the documentation details each of the object methods.
Internal methods are usually preceded with a _

addgenebuilder	No description	Code
fetch_input	Description	Code
get_genebuilders	No description	Code
input_id	No description	Code
new	Description	Code
output	No description	Code
run	No description	Code
write_output	Description	Code