# $Id: TreeIO.pm 16123 2009-09-17 12:57:27Z cjfields $ # # BioPerl module for Bio::TreeIO # # Please direct questions and support issues to # # Cared for by Jason Stajich # # Copyright Jason Stajich # # You may distribute this module under the same terms as perl itself # POD documentation - main docs before the code =head1 NAME Bio::TreeIO - Parser for Tree files =head1 SYNOPSIS { use Bio::TreeIO; my $treeio = Bio::TreeIO->new('-format' => 'newick', '-file' => 'globin.dnd'); while( my $tree = $treeio->next_tree ) { print "Tree is ", $tree->number_nodes, "\n"; } } =head1 DESCRIPTION This is the driver module for Tree reading from data streams and flatfiles. This is intended to be able to create Bio::Tree::TreeI objects. =head1 FEEDBACK =head2 Mailing Lists User feedback is an integral part of the evolution of this and other Bioperl modules. Send your comments and suggestions preferably to the Bioperl mailing list. Your participation is much appreciated. bioperl-l@bioperl.org - General discussion http://bioperl.org/wiki/Mailing_lists - About the mailing lists =head2 Support Please direct usage questions or support issues to the mailing list: I rather than to the module maintainer directly. Many experienced and reponsive experts will be able look at the problem and quickly address it. Please include a thorough description of the problem with code and data examples if at all possible. =head2 Reporting Bugs Report bugs to the Bioperl bug tracking system to help us keep track of the bugs and their resolution. Bug reports can be submitted via the web: http://bugzilla.open-bio.org/ =head1 AUTHOR - Jason Stajich Email jason-at-bioperl-dot-org =head1 CONTRIBUTORS Allen Day Eallenday@ucla.eduE =head1 APPENDIX The rest of the documentation details each of the object methods. Internal methods are usually preceded with a _ =cut # Let the code begin... package Bio::TreeIO; use strict; # Object preamble - inherits from Bio::Root::Root use Bio::TreeIO::TreeEventBuilder; use base qw(Bio::Root::Root Bio::Root::IO Bio::Event::EventGeneratorI Bio::Factory::TreeFactoryI); use constant INTERNAL_NODE_ID => 'id'; # id or bootstrap, default is 'id' =head2 new Title : new Usage : my $obj = Bio::TreeIO->new(); Function: Builds a new Bio::TreeIO object Returns : Bio::TreeIO Args : a hash. useful keys: -format : Specify the format of the file. Supported formats: newick Newick tree format nexus Nexus tree format nhx NHX tree format svggraph SVG graphical representation of tree tabtree ASCII text representation of tree lintree lintree output format -internal_node_id : what is stored in the internal node ids, bootstrap values or ids, coded as 'bootstrap' or 'id' =cut sub new { my($caller,@args) = @_; my $class = ref($caller) || $caller; # or do we want to call SUPER on an object if $caller is an # object? if( $class =~ /Bio::TreeIO::(\S+)/ ) { my ($self) = $class->SUPER::new(@args); $self->_initialize(@args); return $self; } else { my %param = @args; @param{ map { lc $_ } keys %param } = values %param; # lowercase keys my $format = $param{'-format'} || $class->_guess_format( $param{'-file'} || $ARGV[0] ) || 'newick'; $format = "\L$format"; # normalize capitalization to lower case # normalize capitalization return unless( $class->_load_format_module($format) ); return "Bio::TreeIO::$format"->new(@args); } } =head2 next_tree Title : next_tree Usage : my $tree = $treeio->next_tree; Function: Gets the next tree off the stream Returns : Bio::Tree::TreeI or undef if no more trees Args : none =cut sub next_tree{ my ($self) = @_; $self->throw("Cannot call method next_tree on Bio::TreeIO object must use a subclass"); } =head2 write_tree Title : write_tree Usage : $treeio->write_tree($tree); Function: Writes a tree onto the stream Returns : none Args : Bio::Tree::TreeI =cut sub write_tree{ my ($self,$tree) = @_; $self->throw("Cannot call method write_tree on Bio::TreeIO object must use a subclass"); } =head2 attach_EventHandler Title : attach_EventHandler Usage : $parser->attatch_EventHandler($handler) Function: Adds an event handler to listen for events Returns : none Args : Bio::Event::EventHandlerI =cut sub attach_EventHandler{ my ($self,$handler) = @_; return if( ! $handler ); if( ! $handler->isa('Bio::Event::EventHandlerI') ) { $self->warn("Ignoring request to attach handler ".ref($handler). ' because it is not a Bio::Event::EventHandlerI'); } $self->{'_handler'} = $handler; return; } =head2 _eventHandler Title : _eventHandler Usage : private Function: Get the EventHandler Returns : Bio::Event::EventHandlerI Args : none =cut sub _eventHandler{ my ($self) = @_; return $self->{'_handler'}; } sub _initialize { my($self, @args) = @_; $self->{'_handler'} = undef; my $internal_node_id; $self->{'internal_node_id'} = INTERNAL_NODE_ID; ($self->{'newline_each_node'},$internal_node_id) = $self->_rearrange ([qw(NEWLINE_EACH_NODE INTERNAL_NODE_ID)],@args); # initialize the IO part $self->_initialize_io(@args); $self->attach_EventHandler(Bio::TreeIO::TreeEventBuilder->new (-verbose => $self->verbose(), @args)); $self->internal_node_id($internal_node_id) if defined $internal_node_id; } =head2 _load_format_module Title : _load_format_module Usage : *INTERNAL TreeIO stuff* Function: Loads up (like use) a module at run time on demand Example : Returns : Args : =cut sub _load_format_module { my ($self,$format) = @_; my $module = "Bio::TreeIO::" . $format; my $ok; eval { $ok = $self->_load_module($module); }; if ( $@ ) { print STDERR <newline_each_node($newval) Function: Get/set newline each node flag which is only applicable for writing tree formats for nhx and newick, will print a newline after each node or paren Returns : value of newline_each_node (boolean) Args : on set, new value (a boolean or undef, optional) =cut sub newline_each_node{ my $self = shift; return $self->{'newline_each_node'} = shift if @_; return $self->{'newline_each_node'}; } =head2 internal_node_id Title : internal_node_id Usage : $obj->internal_node_id($newval) Function: Internal Node Id type, coded as 'bootstrap' or 'id' Default is 'id' Returns : value of internal_node_id (a scalar) Args : on set, new value (a scalar or undef, optional) =cut sub internal_node_id{ my $self = shift; my $val = shift; if( defined $val ) { if( $val =~ /^b/i ) { $val = 'bootstrap'; } elsif( $val =~ /^i/ ) { $val = 'id'; } else { $self->warn("Unknown value $val for internal_node_id not resetting value\n"); } return $self->{'internal_node_id'} = $val; } return $self->{'internal_node_id'}; } =head2 _guess_format Title : _guess_format Usage : $obj->_guess_format($filename) Function: Example : Returns : guessed format of filename (lower case) Args : =cut sub _guess_format { my $class = shift; return unless $_ = shift; return 'newick' if /\.(dnd|newick|nh)$/i; return 'nhx' if /\.(nhx)$/i; return 'phyloxml' if /\.(xml)$/i; return 'svggraph' if /\.svg$/i; return 'lintree' if( /\.(lin|lintree)$/i ); } sub DESTROY { my $self = shift; $self->close(); } sub TIEHANDLE { my $class = shift; return bless {'treeio' => shift},$class; } sub READLINE { my $self = shift; return $self->{'treeio'}->next_tree() unless wantarray; my (@list,$obj); push @list,$obj while $obj = $self->{'treeio'}->next_tree(); return @list; } sub PRINT { my $self = shift; $self->{'treeio'}->write_tree(@_); } 1;