Raw content of BioMart::Formatter::FASTA # $Id: FASTA.pm,v 1.4 2008/04/09 12:52:34 syed Exp $ # # BioMart module for BioMart::Formatter::TXT # # You may distribute this module under the same terms as perl # itself. # POD documentation - main docs before the code. =head1 NAME BioMart::Formatter::FASTA =head1 SYNOPSIS The FASTA Formatter returns whitespace separated tabular data for a BioMart query's ResultTable =head1 DESCRIPTION When given a BioMart::ResultTable containing the results of a BioMart::Query the FASTA Formatter will return tabular output with one line for each row of data in the ResultTable and single spaces separating the individual entries in each row. The getDisplayNames and getFooterText can be used to return appropiately formatted headers and footers respectively =head1 AUTHOR - Syed Haider, Damian Smedley =head1 CONTACT This module is part of the BioMart project http://www.biomart.org Questions can be posted to the mart-dev mailing list: mart-dev@ebi.ac.uk =head1 METHODS =cut package BioMart::Formatter::FASTA; use strict; use warnings; # Extends BioMart::FormatterI use base qw(BioMart::FormatterI); sub _new { my ($self) = @_; $self->SUPER::_new(); } sub processQuery { my ($self, $query) = @_; $self->set('original_attributes',[@{$query->getAllAttributes()}]) if ($query->getAllAttributes()); $self->set('query',$query); return $query; } sub nextRow { my $self = shift; my $rtable = $self->get('result_table'); my $row = $rtable->nextRow; if (!$row){ return; } my $array_length = @{$row}; map { $_ = '' unless defined ($_); } @$row; # get rid of unitialized-value warning message my $header_atts = join "|",@{$row}[1..$array_length-1]; #chop $header_atts; my $seq = ${$row}[0]; ### SPECIAL LOGIC FOR SNP SEQUENCES, to make them agree with FASTA FORMAT ### THE * would suggest the split between two sequnce snp sequences ### The allele would go into header, which comes from genomic sequence ### in tags separating two snp sequences and that gets replaced by _, ### this tag look like %allele%. eg. %A/T%. I am using this assumption ### of % sign as TO DATE i have never seen a residue string containing ### % sign, ### for those how want to post process them in a different way, may use _ ### as a splitting point if ($seq =~ m/\%(.*)\%/) { $header_atts .= "|$1"; ## also substiture with * $seq =~ s/\%.*\%/\_/; } ######################################################################## $seq =~ s/(\w{60})/$1\n/g; return ">" . $header_atts . "\n" . $seq ."\n"; } sub getDisplayNames { my $self = shift; return ''; } sub isSpecial { return 1; } 1;