Raw content of Bio::EnsEMBL::Variation::DBSQL::VariationGroupFeatureAdaptor # # Ensembl module Bio::EnsEMBL::Variation::DBSQL::VariationGroupFeatureAdaptor # # Copyright (c) 2004 Ensembl # # You may distribute this module under the same terms as perl itself # # =head1 NAME Bio::EnsEMBL::Variation::DBSQL::VariationGroupFeatureAdaptor =head1 SYNOPSIS $vdb = Bio::EnsEMBL::Variation::DBSQL::DBAdaptor->new(...); $db = Bio::EnsEMBL::DBSQL::DBAdaptor->new(...); # tell the variation database where core database information can be # be found $vdb->dnadb($db); $vga = $vdb->get_VariationGroupAdaptor(); $vgfa = $vdb->get_VariationGroupFeatureAdaptor(); $sa = $db->get_SliceAdaptor(); # Get a VariationFeature by its internal identifier $vgf = $vgfa->fetch_by_dbID(145); # get all VariationFeatures in a region $slice = $sa->fetch_by_region('chromosome', 'X', 1e6, 2e6); foreach $vgf (@{$vgfa->fetch_all_by_Slice($slice)}) { print $vgf->start(), '-', $vgf->end(), ' ', $vgf->allele_string(), "\n"; } # fetch all genome hits for a particular variation group $vg = $vga->fetch_by_name('PERLEGEN:B000002'); foreach $vgf (@{$vgfa->fetch_all_by_VariationGroup($vg)}) { print $vgf->seq_region_name(), $vgf->seq_region_start(), '-', $vgf->seq_region_end(),"\n"; } =head1 DESCRIPTION This adaptor provides database connectivity for VariationGroupFeature objects. Genomic locations of VariationGroups can be obtained from the variation database using this adaptor. See the base class BaseFeatureAdaptor for more information. =head1 AUTHOR - Graham McVicker =head1 CONTACT Post questions to the Ensembl development list ensembl-dev@ebi.ac.uk =head1 METHODS =cut use strict; use warnings; package Bio::EnsEMBL::Variation::DBSQL::VariationGroupFeatureAdaptor; use Bio::EnsEMBL::Variation::VariationGroupFeature; use Bio::EnsEMBL::DBSQL::BaseFeatureAdaptor; our @ISA = ('Bio::EnsEMBL::DBSQL::BaseFeatureAdaptor'); =head2 fetch_all_by_Variation Arg [1] : Bio::EnsEMBL:Variation::Variation $var Example : my @vfs = @{$vfa->fetch_all_by_Variation($var)}; Description: Retrieves all variation features for a given variation. Most variations should only hit the genome once and only a return a single variation feature. Returntype : reference to list Bio::EnsEMBL::Variation::VariationFeature Exceptions : throw on bad argument Caller : general Status : At Risk =cut sub fetch_all_by_VariationGroup { my $self = shift; my $vg = shift; if(!ref($vg) || !$vg->isa('Bio::EnsEMBL::Variation::VariationGroup')) { throw('Bio::EnsEMBL::Variation::VariationGroup arg expected'); } if(!defined($vg->dbID())) { throw("VariationGroup arg must have defined dbID"); } return $self->generic_fetch("vgf.variation_group_id = ".$vg->dbID()); } # method used by superclass to construct SQL sub _tables { return ['variation_group_feature', 'vgf']; } sub _columns { return qw( vgf.variation_group_feature_id vgf.seq_region_id vgf.seq_region_start vgf.seq_region_end vgf.seq_region_strand vgf.variation_group_id vgf.variation_group_name ); } sub _objs_from_sth { my ($self, $sth, $mapper, $dest_slice) = @_; # # This code is ugly because an attempt has been made to remove as many # function calls as possible for speed purposes. Thus many caches and # a fair bit of gymnastics is used. # my $sa = $self->db()->dnadb()->get_SliceAdaptor(); my @features; my %slice_hash; my %sr_name_hash; my %sr_cs_hash; my ($variation_group_feature_id, $seq_region_id, $seq_region_start, $seq_region_end, $seq_region_strand, $variation_group_id, $variation_group_name ); $sth->bind_columns(\$variation_group_feature_id, \$seq_region_id, \$seq_region_start, \$seq_region_end, \$seq_region_strand, \$variation_group_id, \$variation_group_name); my $asm_cs; my $cmp_cs; my $asm_cs_vers; my $asm_cs_name; my $cmp_cs_vers; my $cmp_cs_name; if($mapper) { $asm_cs = $mapper->assembled_CoordSystem(); $cmp_cs = $mapper->component_CoordSystem(); $asm_cs_name = $asm_cs->name(); $asm_cs_vers = $asm_cs->version(); $cmp_cs_name = $cmp_cs->name(); $cmp_cs_vers = $cmp_cs->version(); } my $dest_slice_start; my $dest_slice_end; my $dest_slice_strand; my $dest_slice_length; if($dest_slice) { $dest_slice_start = $dest_slice->start(); $dest_slice_end = $dest_slice->end(); $dest_slice_strand = $dest_slice->strand(); $dest_slice_length = $dest_slice->length(); } FEATURE: while($sth->fetch()) { #get the slice object my $slice = $slice_hash{"ID:".$seq_region_id}; if(!$slice) { $slice = $sa->fetch_by_seq_region_id($seq_region_id); $slice_hash{"ID:".$seq_region_id} = $slice; $sr_name_hash{$seq_region_id} = $slice->seq_region_name(); $sr_cs_hash{$seq_region_id} = $slice->coord_system(); } # # remap the feature coordinates to another coord system # if a mapper was provided # if($mapper) { my $sr_name = $sr_name_hash{$seq_region_id}; my $sr_cs = $sr_cs_hash{$seq_region_id}; ($sr_name,$seq_region_start,$seq_region_end,$seq_region_strand) = $mapper->fastmap($sr_name, $seq_region_start, $seq_region_end, $seq_region_strand, $sr_cs); #skip features that map to gaps or coord system boundaries next FEATURE if(!defined($sr_name)); #get a slice in the coord system we just mapped to if($asm_cs == $sr_cs || ($cmp_cs != $sr_cs && $asm_cs->equals($sr_cs))) { $slice = $slice_hash{"NAME:$sr_name:$cmp_cs_name:$cmp_cs_vers"} ||= $sa->fetch_by_region($cmp_cs_name, $sr_name,undef, undef, undef, $cmp_cs_vers); } else { $slice = $slice_hash{"NAME:$sr_name:$asm_cs_name:$asm_cs_vers"} ||= $sa->fetch_by_region($asm_cs_name, $sr_name, undef, undef, undef, $asm_cs_vers); } } # # If a destination slice was provided convert the coords # If the dest_slice starts at 1 and is foward strand, nothing needs doing # if($dest_slice) { if($dest_slice_start != 1 || $dest_slice_strand != 1) { if($dest_slice_strand == 1) { $seq_region_start = $seq_region_start - $dest_slice_start + 1; $seq_region_end = $seq_region_end - $dest_slice_start + 1; } else { my $tmp_seq_region_start = $seq_region_start; $seq_region_start = $dest_slice_end - $seq_region_end + 1; $seq_region_end = $dest_slice_end - $tmp_seq_region_start + 1; $seq_region_strand *= -1; } #throw away features off the end of the requested slice if($seq_region_end < 1 || $seq_region_start > $dest_slice_length) { next FEATURE; } } $slice = $dest_slice; } push @features, Bio::EnsEMBL::Variation::VariationGroupFeature->new (-start => $seq_region_start, -end => $seq_region_end, -strand => $seq_region_strand, -slice => $slice, -variation_group_name => $variation_group_name, -variation_group_id => $variation_group_id, -adaptor => $self, -dbID => $variation_group_feature_id); } return \@features; } =head2 list_dbIDs Arg [1] : none Example : @feature_ids = @{$simple_feature_adaptor->list_dbIDs()}; Description: Gets an array of internal ids for all simple features in the current db Returntype : list of ints Exceptions : none Caller : general Status : At Risk =cut sub list_dbIDs { my $self = shift; return $self->_list_dbIDs('variation_feature'); } 1;