3 # BioPerl module for Bio::TreeIO::newick
5 # Cared for by Jason Stajich <jason@bioperl.org>
7 # Copyright Jason Stajich
9 # You may distribute this module under the same terms as perl itself
11 # POD documentation - main docs before the code
15 Bio::TreeIO::newick - TreeIO implementation for parsing
16 Newick/New Hampshire/PHYLIP format.
20 # do not use this module directly
22 my $treeio = Bio::TreeIO->new(-format => 'newick',
23 -file => 't/data/LOAD_Ccd1.dnd');
24 my $tree = $treeio->next_tree;
28 This module handles parsing and writing of Newick/PHYLIP/New Hampshire format.
34 User feedback is an integral part of the evolution of this and other
35 Bioperl modules. Send your comments and suggestions preferably to the
36 Bioperl mailing list. Your participation is much appreciated.
38 bioperl-l@bioperl.org - General discussion
39 http://bioperl.org/wiki/Mailing_lists - About the mailing lists
43 Report bugs to the Bioperl bug tracking system to help us keep track
44 of the bugs and their resolution. Bug reports can be submitted via the web:
47 http://bugzilla.open-bio.org/
49 =head1 AUTHOR - Jason Stajich
51 Email jason-at-bioperl-dot-org
55 The rest of the documentation details each of the object methods.
56 Internal methods are usually preceded with a _
61 # Let the code begin...
64 package Bio
::TreeIO
::newick
;
65 use vars
qw($DefaultBootstrapStyle);
68 use Bio::Event::EventGeneratorI;
70 #initialize some package variables, could use 'our' but fails in perl < 5.6
72 $DefaultBootstrapStyle = 'traditional';
73 use base qw(Bio::TreeIO);
79 Args : -print_count => boolean, default is false
80 -bootstrap_style => set the bootstrap style (one of nobranchlength, molphy, traditional)
82 -order_by => set the order by sort method
83 (see L<Bio::Node::Node::each_Descendent()> )
89 $self->SUPER::_initialize
(@_);
90 my ($print_count,$style,$order_by) = $self->_rearrange([qw(PRINT_COUNT
94 $self->print_tree_count($print_count || 0);
95 $self->bootstrap_style($style || $DefaultBootstrapStyle);
96 $self->order_by($order_by) if defined $order_by;
104 Usage : my $tree = $treeio->next_tree
105 Function: Gets the next tree in the stream
106 Returns : L<Bio::Tree::TreeI>
115 return unless $_ = $self->_readline;
118 my $despace = sub {my $dirty = shift; $dirty =~ s/\s+//gs; return $dirty};
119 my $dequote = sub {my $dirty = shift; $dirty =~ s/^"?\s*(.+?)\s*"?$/$1/; return $dirty};
120 s/([^"]*)(".+?")([^"]*)/$despace->($1) . $dequote->($2) . $despace->($3)/egsx;
121 if( s/^\s*\[([^\]]+)\]// ) {
125 if( $match =~ /([-\d\.+]+)/ ) {
130 $self->debug("entry is $_\n");
131 # my $empty = chr(20);
133 # replace empty labels with a tag
134 # s/\(,/\($empty,/ig;
137 # s/,\)/,$empty\)/ig;
141 $self->_eventHandler->start_document;
142 my ($prev_event,$lastevent,$id) = ('','','');
143 foreach my $ch ( split(//,$_) ) {
145 my $tree = $self->_eventHandler->end_document($chars);
146 $tree->score($score) if defined $score;
147 if( $self->internal_node_id eq 'bootstrap' ) {
148 $tree->move_id_to_bootstrap;
151 } elsif( $ch eq '(' ) {
153 $self->_eventHandler->start_element( {'Name' => 'tree'} );
154 } elsif($ch eq ')' ) {
155 if( length($chars) ) {
156 if( $lastevent eq ':' ) {
157 $self->_eventHandler->start_element( { 'Name' => 'branch_length'});
158 $self->_eventHandler->characters($chars);
159 $self->_eventHandler->end_element( {'Name' => 'branch_length'});
160 $lastevent = $prev_event;
162 $self->debug("internal node, id with no branchlength is $chars\n");
163 $self->_eventHandler->start_element( { 'Name' => 'node' } );
164 $self->_eventHandler->start_element( { 'Name' => 'id' } );
165 $self->_eventHandler->characters($chars);
166 $self->_eventHandler->end_element( { 'Name' => 'id' } );
170 if( $lastevent ne ')' ) {
174 $self->_eventHandler->start_element({'Name' => 'leaf'});
175 $self->_eventHandler->characters($leafstatus);
176 $self->_eventHandler->end_element({'Name' => 'leaf'});
179 $self->_eventHandler->start_element( {'Name' => 'node'} );
182 $self->_eventHandler->end_element( {'Name' => 'node'} );
183 $self->_eventHandler->end_element( {'Name' => 'tree'} );
185 } elsif ( $ch eq ',' ) {
186 if( length($chars) ) {
187 if( $lastevent eq ':' ) {
188 $self->_eventHandler->start_element( { 'Name' => 'branch_length'});
189 $self->_eventHandler->characters($chars);
190 $self->_eventHandler->end_element( {'Name' => 'branch_length'});
191 $lastevent = $prev_event;
194 $self->debug("leaf id with no branchlength is $chars\n");
195 $self->_eventHandler->start_element( { 'Name' => 'node' } );
196 $self->_eventHandler->start_element( { 'Name' => 'id' } );
197 $self->_eventHandler->characters($chars);
198 $self->_eventHandler->end_element( { 'Name' => 'id' } );
202 $self->_eventHandler->start_element( { 'Name' => 'node' } );
205 if( $lastevent ne ')' ) {
208 $self->_eventHandler->start_element({'Name' => 'leaf'});
209 $self->_eventHandler->characters($leafstatus);
210 $self->_eventHandler->end_element({'Name' => 'leaf'});
211 $self->_eventHandler->end_element( {'Name' => 'node'} );
214 } elsif( $ch eq ':' ) {
215 $self->debug("id with a branchlength coming is $chars\n");
216 $self->_eventHandler->start_element( { 'Name' => 'node' } );
217 $self->_eventHandler->start_element( { 'Name' => 'id' } );
218 $self->_eventHandler->characters($chars);
219 $self->_eventHandler->end_element( { 'Name' => 'id' } );
226 $prev_event = $lastevent;
235 Usage : $treeio->write_tree($tree);
236 Function: Write a tree out to data stream in newick/phylip format
238 Args : one or more L<Bio::Tree::TreeI> objects
243 my ($self,@trees) = @_;
244 my $orderby = $self->order_by;
245 my $bootstrap_style = $self->bootstrap_style;
246 if( $self->print_tree_count ){
247 $self->_print(sprintf(" %d\n",scalar @trees));
249 my $nl = $self->newline_each_node;
250 foreach my $tree( @trees ) {
252 if( ! defined $tree || ref($tree) =~ /ARRAY/i ||
253 ! $tree->isa('Bio::Tree::TreeI') ) {
254 $self->throw("Calling write_tree with non Bio::Tree::TreeI object\n");
256 my @data = _write_tree_Helper
($tree->get_root_node,
261 chomp($data[-1]);# remove last newline
262 $self->_print(join(",\n", @data), ";\n");
264 $self->_print(join(',', @data), ";\n");
267 $self->flush if $self->_flush_on_write && defined $self->_fh;
271 sub _write_tree_Helper
{
272 my ($node,$style,$orderby,$nl) = @_;
273 $style = '' unless defined $style;
274 return () if (!defined $node);
277 foreach my $n ( $node->each_Descendent($orderby) ) {
278 push @data, _write_tree_Helper
($n,$style,$orderby,$nl);
281 # let's explicitly write out the bootstrap if we've got it
282 my $id = $node->id_output;
283 my $bs = $node->bootstrap; # bs better not have any spaces?
284 $bs =~ s/\s+//g if defined $bs;
285 my $bl = $node->branch_length;
288 $data[0] = "(\n" . $data[0];
291 $data[0] = "(" . $data[0];
295 if( $node->is_Leaf ) {
296 $node->debug("node is a leaf! This is unexpected...");
299 if( ! defined $bl || ! length($bl) ||
300 ($style && $style =~ /nobranchlength/i) ) {
302 } elsif( defined $bl && length($bl) ) {
303 $data[-1] .= "$id:$bl";
308 if( ! defined $bl || ! length($bl) ||
309 ($style && $style =~ /nobranchlength/i) ) {
311 if( defined $id || defined $bs ) {
312 $data[-1] .= defined $bs ?
$bs : $id;
314 } elsif( $style =~ /molphy/i ) {
324 $data[-1] .= "[$bs]";
327 # traditional style of
328 # ((A:1,B:2)81:3); where 3 is internal node branch length
329 # and 81 is bootstrap/node label
330 if( defined $bs || defined $id ) {
331 $data[-1] .= defined $bs ?
"$bs:$bl" : "$id:$bl";
332 } elsif( $bl =~ /\#/ ) {
339 } elsif( defined $id || defined $bl ) {
342 if( ! defined $bl || ! length($bl) ||
343 ($style && $style =~ /nobranchlength/i) ) {
345 } elsif( defined $bl && length($bl) ) {
355 =head2 print_tree_count
357 Title : print_tree_count
358 Usage : $obj->print_tree_count($newval)
359 Function: Get/Set flag for printing out the tree count (paml,protml way)
360 Returns : value of print_tree_count (a scalar)
361 Args : on set, new value (a scalar or undef, optional)
366 sub print_tree_count
{
368 return $self->{'_print_tree_count'} = shift if @_;
369 return $self->{'_print_tree_count'} || 0;
372 =head2 bootstrap_style
374 Title : bootstrap_style
375 Usage : $obj->bootstrap_style($newval)
376 Function: A description of how bootstraps and branch lengths are
377 written, as the ID part of the internal node or else in []
378 in the branch length (Molphy-like; I am sure there is a
379 better name for this but am not sure where to go for some
380 sort of format documentation)
382 If no branch lengths are requested then no bootstraps are usually
383 written (unless someone REALLY wants this functionality...)
385 Can take on strings which contain the possible values of
386 'nobranchlength' --> don't draw any branch lengths - this
387 is helpful if you don't want to have to
388 go through and delete branch len on all nodes
389 'molphy' --> draw bootstraps (100) like
390 (A:0.11,B:0.22):0.33[100];
391 'traditional' --> draw bootstraps (100) like
392 (A:0.11,B:0.22)100:0.33;
393 Returns : value of bootstrap_style (a scalar)
394 Args : on set, new value (a scalar or undef, optional)
# Validate the requested style against the three recognised style names.
# NOTE(review): in the pattern below, '^' binds only to the first
# alternative, so 'nobranchlength' must start the string while 'molphy'
# and 'traditional' are accepted anywhere in $val. Confirm whether the
# alternation should be grouped, e.g. (?:...), or the anchor dropped.
404 if( $val !~ /^nobranchlength|molphy|traditional/i ) {
405 $self->warn("requested an unknown bootstrap style $val, expect one of nobranchlength,molphy,traditional, not updating value. Default is $DefaultBootstrapStyle\n");
407 $self->{'_bootstrap_style'} = $val;
# Return the stored style, or the package default when the stored value
# is unset or false.
410 return $self->{'_bootstrap_style'} || $DefaultBootstrapStyle;
416 Usage : $obj->order_by($newval)
417 Function: Allow node order to be specified (typically "alpha")
418 See L<Bio::Node::Node::each_Descendent()>
419 Returns : value of order_by (a scalar)
420 Args : on set, new value (a scalar or undef, optional)
428 return $self->{'order_by'} = shift if @_;
429 return $self->{'order_by'};