File Coverage

blib/lib/Bio/Nexml/Factory.pm
Criterion Covered Total %
statement 36 320 11.2
branch 1 126 0.7
condition 0 59 0.0
subroutine 13 26 50.0
pod 10 11 90.9
total 60 542 11.0


line stmt bran cond sub pod time code
1             # $Id: Util.pm 15875 2009-07-21 19:20:00Z chmille4 $
2             #
3             # BioPerl module for Bio::Nexml::Factory
4             #
5             # Please direct questions and support issues to
6             #
7             # Cared for by Chase Miller
8             #
9             # Copyright Chase Miller
10             #
11             # You may distribute this module under the same terms as perl itself
12              
13             # POD documentation - main docs before the code
14              
15             =head1 NAME
16              
17             Bio::Nexml::Factory - A factory module for creating BioPerl and Bio::Phylo objects from/to nexml documents
18              
19             =head1 SYNOPSIS
20              
21             Do not use this module directly. It shoulde be used through
22             Bio::NexmlIO, Bio::SeqIO::nexml, Bio::AlignIO::nexml, or
23             Bio::TreeIO::nexml
24            
25              
26             =head1 DESCRIPTION
27              
28             This is a factory/utility module in the Nexml namespace. It contains
29             methods that are needed by multiple modules.
30              
31             This module handles the creation of BioPerl objects from Bio::Phylo
32             objects and vice versa, which is used to read and write nexml
33             documents to and from BioPerl objects.
34              
35             =head1 FEEDBACK
36              
37             =head2 Mailing Lists
38              
39             User feedback is an integral part of the evolution of this and other
40             Bioperl modules. Send your comments and suggestions preferably to
41             the Bioperl mailing list. Your participation is much appreciated.
42              
43             bioperl-l@bioperl.org - General discussion
44             http://bioperl.org/wiki/Mailing_lists - About the mailing lists
45              
46             =head2 Support
47              
48             Please direct usage questions or support issues to the mailing list:
49              
50             I
51              
52             rather than to the module maintainer directly. Many experienced and
53             reponsive experts will be able look at the problem and quickly
54             address it. Please include a thorough description of the problem
55             with code and data examples if at all possible.
56              
57             =head2 Reporting Bugs
58              
59             Report bugs to the Bioperl bug tracking system to help us keep track
60             of the bugs and their resolution. Bug reports can be submitted via
61             the web:
62              
63             https://github.com/bioperl/bioperl-live/issues
64              
65             =head1 AUTHOR - Chase Miller
66              
67             Email chmille4@gmail.com
68              
69             =head1 APPENDIX
70              
71             The rest of the documentation details each of the object methods.
72             Internal methods are usually preceded with a _
73              
74             =cut
75              
76              
77             #Let the code begin
78              
79             package Bio::Nexml::Factory;
80              
81 3     3   17 use strict;
  3         6  
  3         102  
82              
83             BEGIN {
84 3     3   320 use Bio::Root::Root;
  3         7  
  3         121  
85 3 50   3   182 unless (eval "require Bio::Phylo; 1") {
86 0         0 Bio::Root::Root->throw("Bio::Phylo package required; see http://www.nexml.org for download details");
87             }
88             }
89            
90 3     3   781 use Bio::Phylo::Factory;
  3         1994  
  3         16  
91 3     3   746 use Bio::Phylo::Matrices;
  3         52259  
  3         90  
92 3     3   1375 use Bio::Phylo::Matrices::Matrix;
  3         47772  
  3         29  
93 3     3   129 use Bio::Phylo::Matrices::Datum;
  3         9  
  3         20  
94 3     3   1389 use Bio::Phylo::Forest::Tree;
  3         59889  
  3         26  
95 3     3   102 use Bio::Phylo::Matrices;
  3         7  
  3         18  
96 3     3   67 use Bio::Phylo::IO;
  3         6  
  3         112  
97              
98 3     3   1638 use Bio::SeqFeature::Generic;
  3         11  
  3         116  
99              
100              
101 3     3   62 use base qw(Bio::Root::Root);
  3         10  
  3         7217  
102              
103             my $fac = Bio::Phylo::Factory->new();
104              
105              
106             =head2 new
107              
108             Title : new
109             Usage : my $obj = Bio::Nexml::Factory->new();
110             Function: Builds a new L object
111             Returns : L object
112             Args : none
113              
114             =cut
115              
116             sub new {
117 1     1 1 4 my($class,@args) = @_;
118 1         13 my $self = $class->SUPER::new(@args);
119             }
120              
121             #should all these creates be private methods?
122             # naah./maj
123              
124             =head2 create_bperl_aln
125              
126             Title : create_bperl_aln
127             Usage : my @alns = $factory->create_bperl_aln($objIO);
128             Function: Converts Bio::Phylo::Matrices::Matrix objects into L objects
129             Returns : an array of L objects
130             Args : Bio::NexmlIO, Bio::SeqIO, Bio::AlignIO, or Bio::TreeIO
131              
132             see [http://search.cpan.org/~rvosa/Bio-Phylo/lib/Bio/Phylo/Project.pm Bio::Phylo::Project]
133              
134             =cut
135              
136             sub create_bperl_aln {
137 0     0 1   my ($self, $caller) = @_;
138 0           my ($start, $end, $seq, $desc);
139 0           my $matrices = $caller->doc->get_matrices();
140 0           my @alns;
141            
142 0           foreach my $matrix (@$matrices)
143             {
144             #check if mol_type is something that makes sense to be an aln
145 0           my $mol_type = lc($matrix->get_type());
146 0 0 0       unless ($mol_type eq 'dna' || $mol_type eq 'rna' || $mol_type eq 'protein')
      0        
147             {
148 0           next;
149             # something for the back-burner: BioPerl has objects
150             # to handle arbitrary genotypes; might be cool to
151             # be able to create something besides alignments
152             # here .../maj
153             }
154            
155             #continue creating an aln
156 0           my $aln = Bio::SimpleAlign->new();
157 0           my $taxa = $matrix->get_taxa();
158            
159             # TODO: should $caller->{_ID} always be defined?
160             # ATM, this is a Bio::AlignIO::nexml stream...
161 0 0         $aln->{_Nexml_ID} = $caller->{_ID}? $caller->{_ID} . $taxa->get_xml_id : $taxa->get_xml_id;
162            
163 0           my $aln_feats = Bio::SeqFeature::Generic->new();
164 0           $aln_feats->add_tag_value('NexmlIO_ID', $caller->{_ID});
165             #check if there is a taxa associated with this alignment
166 0 0         if ($taxa) {
167 0           $aln_feats->add_tag_value('taxa_id', $taxa->get_xml_id());
168 0 0         $aln_feats->add_tag_value('taxa_label', $taxa->get_name()) if $taxa->get_name();
169            
170 0           my $taxon = $taxa->first;
171 0           while ($taxon) {
172 0           $aln_feats->add_tag_value('taxon', $taxon->get_name);
173 0           $taxon = $taxa->next;
174             }
175             }
176 0           $aln->add_SeqFeature($aln_feats);
177            
178 0           my $basename = $matrix->get_name();
179 0           $aln->id($basename);
180 0           my $seqNum = 0;
181 0           my$row = $matrix->first;
182 0           while ($row)
183             {
184 0           my $newSeq = $row->get_char();
185 0           my $rowlabel;
186 0           $seqNum++;
187            
188             #constuct seqID based on matrix label and row id
189 0           my $seqID = "$basename.row_$seqNum";
190            
191             #Check if theres a row label and if not default to seqID
192 0 0         if( !defined($rowlabel = $row->get_name())) {$rowlabel = $seqID;}
  0            
193              
194 0           $seq = Bio::LocatableSeq->new(
195             -seq => $newSeq,
196             -display_id => "$rowlabel",
197             #-description => $desc,
198             -alphabet => $mol_type,
199             );
200 0           my $seq_feats;
201             #check if there is a taxa associated w/ this alignment
202 0 0         if($taxa)
203             {
204 0 0         if (my $taxon = $taxa->get_by_name($row->get_taxon->get_name())) {
205             #attach taxon to each sequence by using the sequenceID because
206             #LocatableSeq does not support features
207 0           my $taxon_name = $taxon->get_name();
208 0           $seq_feats = Bio::SeqFeature::Generic->new();
209 0           $seq_feats->add_tag_value('taxon', "$taxon_name");
210 0           $seq_feats->add_tag_value('id', "$rowlabel");
211             }
212             }
213 0           $aln->add_seq($seq);
214 0           $aln->add_SeqFeature($seq_feats);
215 0           $self->debug("Reading r$rowlabel\n");
216            
217 0           $row = $matrix->next();
218             }
219 0           push (@alns, $aln);
220             }
221 0           return \@alns;
222             }
223              
224              
225             =head2 create_bperl_tree
226              
227             Title : create_bperl_tree
228             Usage : my @trees = $factory->create_bperl_seq($objIO);
229             Function: Converts Bio::Phylo::Forest::Tree objects into L objects
230             Returns : an array of L objects
231             Args : Bio::NexmlIO, Bio::SeqIO, Bio::AlignIO, or Bio::TreeIO
232              
233             see [http://search.cpan.org/~rvosa/Bio-Phylo/lib/Bio/Phylo/Project.pm Bio::Phylo::Project]
234              
235             =cut
236              
237             sub create_bperl_tree {
238 0     0 1   my($self, $caller) = @_;
239 0           my @trees;
240            
241 0           my $forests = $caller->doc->get_forests();
242            
243 0           foreach my $forest (@$forests)
244             {
245 0   0       my $basename = $forest->get_name() || '';
246 0           my $taxa = $forest->get_taxa();
247 0           my $taxa_label = $taxa->get_name();
248 0           my $taxa_id = $taxa->get_xml_id();
249            
250 0           my $t = $forest->first();
251            
252 0           while ($t)
253             {
254 0           my %created_nodes;
255 0           my $tree_id = $t->get_name();
256 0           my $tree = Bio::Tree::Tree->new(-id => "$basename.$tree_id");
257              
258             #set the taxa info of the tree
259 0 0         $tree->add_tag_value('taxa_label', $taxa_label) if defined($taxa_label);
260 0 0         $tree->add_tag_value('taxa_id', $taxa_id) if defined($taxa_id);
261              
262             # TODO: should $caller->{_ID} always be defined?
263             # ATM, this is a Bio::TreeIO::nexml stream...
264 0 0         $tree->add_tag_value('_NexmlIO_ID', $caller->{_ID}) if $caller->{_ID};
265            
266 0           my $taxon = $taxa->first;
267 0           while($taxon) {
268 0 0         $tree->add_tag_value('taxon', $taxon->get_name()) if defined($taxon->get_name);
269 0           $taxon = $taxa->next;
270             }
271            
272             #process terminals only, removing terminals as they get processed
273             #which inturn creates new terminals to process until the entire tree has been processed
274 0           my $terminals = $t->get_terminals();
275             # for(my $i=0; $i<@$terminals; $i++)
276 0           while (my $terminal = shift @$terminals)
277             {
278             # my $terminal = $$terminals[$i];
279 0           my $new_node_id = $terminal->get_name();
280 0           my $newNode;
281              
282 0 0         if(exists $created_nodes{$new_node_id})
283             {
284 0           $newNode = $created_nodes{$new_node_id};
285             }
286             else
287             {
288 0           $newNode = Bio::Tree::Node->new();
289 0   0       $new_node_id ||= 'internal_'.$newNode->_creation_id;
290 0           $newNode->id($new_node_id);
291              
292 0           $created_nodes{$new_node_id} = $newNode;
293             }
294            
295             #check if taxa data exists for the current node ($terminal)
296 0 0         if($taxa) {
297 0           my $taxon = $terminal->get_taxon();
298 0 0 0       $newNode->add_tag_value("taxon", $taxon->get_name()) if $taxon && $taxon->get_name;
299             }
300            
301             #check if you've reached the root of the tree and if so, stop.
302 0 0         if($terminal->is_root()) {
303 0           $tree->set_root_node($newNode);
304 0           last;
305             }
306            
307             #transfer attributes that apply to non-root only nodes
308 0           $newNode->branch_length($terminal->get_branch_length());
309            
310 0           my $parent = $terminal->get_parent();
311 0           my $parentID = $parent->get_name();
312 0 0         if(exists $created_nodes{$parentID})
313             {
314              
315 0           $created_nodes{$parentID}->add_Descendent($newNode);
316             }
317             else
318             {
319 0           my $parent_node = Bio::Tree::Node->new();
320 0   0       $parentID ||= 'internal_'.$parent_node->_creation_id;
321 0           $parent_node->id($parentID);
322 0           $parent_node->add_Descendent($newNode);
323 0           $created_nodes{$parentID} = $parent_node;
324             }
325             #remove processed node from tree
326 0           $parent->prune_child($terminal);
327            
328             #check if the parent of the removed node is now a terminal node and should be added for processing
329 0 0         if($parent->is_terminal())
330             {
331 0 0         push(@$terminals, $terminal->get_parent()) if $terminal->get_parent;
332             }
333             }
334 0           push @trees, $tree;
335 0           $t = $forest->next();
336             }
337             }
338 0           return \@trees;
339             }
340              
341             =head2 create_bperl_seq
342              
343             Title : create_bperl_seq
344             Usage : my @seqs = $factory->create_bperl_seq($objIO);
345             Function: Converts Bio::Phylo::Matrices::Datum objects into L objects
346             Returns : an array of L objects
347             Args : Bio::NexmlIO, Bio::SeqIO, Bio::AlignIO, or Bio::TreeIO
348              
349             see [http://search.cpan.org/~rvosa/Bio-Phylo/lib/Bio/Phylo/Project.pm Bio::Phylo::Project]
350              
351             =cut
352              
353             sub create_bperl_seq {
354 0     0 1   my($self, $caller) = @_;
355 0           my $matrices = $caller->doc->get_matrices();
356 0           my @seqs;
357            
358 0           foreach my $matrix (@$matrices)
359             {
360             #check if mol_type is something that makes sense to be a seq
361 0           my $mol_type = lc($matrix->get_type());
362 0 0 0       unless ($mol_type eq 'dna' || $mol_type eq 'rna' || $mol_type eq 'protein')
      0        
363             {
364 0           next;
365             }
366            
367 0           my $taxa = $matrix->get_taxa();
368 0           my $seqnum = 0;
369 0           my $taxa_id = $taxa->get_xml_id();
370 0           my $taxa_label = $taxa->get_name();
371 0           my $basename = $matrix->get_name();
372 0           my $row = $matrix->first;
373 0           while ($row)
374             {
375 0           my $newSeq = $row->get_char();
376 0           my $feat = Bio::SeqFeature::Generic->new();
377 0 0         $feat->add_tag_value('matrix_label', $matrix->get_name()) if defined($matrix->get_name);
378 0           $feat->add_tag_value('matrix_id', $matrix->get_xml_id());
379 0           $feat->add_tag_value('NexmlIO_ID', $caller->{_ID});
380 0 0         $feat->add_tag_value('taxa_id', $taxa_id) if defined($taxa_id);
381 0 0         $feat->add_tag_value('taxa_label', $taxa_label) if defined($taxa_label);
382            
383 0           $seqnum++;
384             #construct full sequence id by using bio::phylo "matrix label" and "row id"
385 0           my $seqID = "$basename.seq_$seqnum";
386 0           my $rowlabel;
387             #check if there is a label for the row, if not default to seqID
388 0 0         if (!defined ($rowlabel = $row->get_name())) {$rowlabel = $seqID;}
  0            
389 0           else {$seqID = $rowlabel;}
390            
391             #build the seq object using the factory create method
392 0           my $seqbuilder = Bio::Seq::SeqFactory->new('-type' => 'Bio::Seq');
393 0           my $seq = $seqbuilder->create(
394             -seq => $newSeq,
395             -id => $rowlabel,
396             -primary_id => $seqID,
397             #-desc => $fulldesc,
398             -alphabet => $mol_type,
399             -direct => 1,
400             );
401             # TODO: should $caller->{_ID} always be defined?
402             # ATM, this is a Bio::SeqIO::nexml stream...
403 0 0         $seq->{_Nexml_ID} = $caller->{_ID} ? $caller->{_ID} . $taxa_id : $taxa_id;
404 0 0         $seq->{_Nexml_matrix_ID} = $caller->{_ID} ? $caller->{_ID} . $matrix->get_xml_id() : $matrix->get_xml_id();
405            
406             #check if taxon linked to sequence if so create feature to attach to alignment
407 0 0         if ($taxa) {
408 0           my $taxon = $taxa->first;
409 0           while ($taxon) {
410 0 0         $feat->add_tag_value('taxon', $taxon->get_name) if defined($taxon->get_name);
411 0 0         if($taxon eq $row->get_taxon) {
412 0           my $taxon_name = $taxon->get_name();
413            
414 0 0         $feat->add_tag_value('my_taxon', "$taxon_name") if defined($taxon_name);
415 0           $feat->add_tag_value('id', $rowlabel);
416             }
417 0           $taxon = $taxa->next;
418             }
419             }
420 0           $seq->add_SeqFeature($feat);
421 0           push (@seqs, $seq);
422            
423 0           $row = $matrix->next;
424             }
425             }
426 0           return \@seqs;
427             }
428              
429             =head2 create_bphylo_tree
430              
431             Title : create_bphylo_tree
432             Usage : my $bphylo_tree = $factory->create_bphylo_tree($bperl_tree);
433             Function: Converts a L object into Bio::Phylo::Forest::Tree object
434             Returns : a Bio::Phylo::Forest::Tree object
435             Args : Bio::Tree::Tree object
436              
437             =cut
438              
439             sub create_bphylo_tree {
440 0     0 1   my ($self, $bptree, $taxa) = @_;
441             #most of the code below ripped form Bio::Phylo::Forest::Tree::new_from_bioperl()d
442            
443 0           my $tree = $fac->create_tree;
444 0           my $class = 'Bio::Phylo::Forest::Tree';
445            
446 0 0 0       if ( ref $bptree && $bptree->isa('Bio::Tree::TreeI') ) {
447 0           bless $tree, $class;
448 0           ($tree) = _copy_tree( $tree, $bptree->get_root_node, "", $taxa);
449            
450             # copy name
451 0           my $name = $bptree->id;
452 0 0         $tree->set_name( $name ) if defined $name;
453            
454             # copy score
455 0           my $score = $bptree->score;
456 0 0         $tree->set_score( $score ) if defined $score;
457             }
458             else {
459 0           $self->throw('Not a bioperl tree!');
460             }
461 0           return $tree;
462             }
463              
464              
465             sub _copy_tree {
466 0     0     my ( $tree, $bpnode, $parent, $taxa ) = @_;
467 0           my $node = create_bphylo_node($bpnode);
468 0           my $taxon;
469 0 0         if ($parent) {
470 0           $parent->set_child($node);
471             }
472 0 0         if (my $bptaxon_name = $bpnode->get_tag_values('taxon'))
473             {
474 0           $node->set_taxon($taxa->get_by_name($bptaxon_name));
475             }
476 0           $tree->insert($node);
477 0           foreach my $bpchild ( $bpnode->each_Descendent ) {
478 0           _copy_tree( $tree, $bpchild, $node, $taxa );
479             }
480 0           return $tree;
481             }
482              
483             =head2 create_bphylo_node
484              
485             Title : create_bphylo_node
486             Usage : my $bphylo_node = $factory->create_bphylo_node($bperl_node);
487             Function: Converts a L object into Bio::Phylo::Forest::Node object
488             Returns : a Bio::Phylo::Forest::Node object
489             Args : L object
490              
491             =cut
492              
493             sub create_bphylo_node {
494 0     0 1   my ($bpnode) = @_;
495 0           my $node = Bio::Phylo::Forest::Node->new();
496            
497             #mostly ripped from Bio::Phylo::Forest::Node->new_from_bioperl()
498             # copy name
499 0           my $name = $bpnode->id;
500 0 0         $node->set_name( $name ) if defined $name;
501            
502             # copy branch length
503 0           my $branch_length = $bpnode->branch_length;
504 0 0         $node->set_branch_length( $branch_length ) if defined $branch_length;
505            
506             # copy description
507 0           my $desc = $bpnode->description;
508 0 0         $node->set_desc( $desc ) if defined $desc;
509            
510             # copy bootstrap
511 0           my $bootstrap = $bpnode->bootstrap;
512 0 0 0       $node->set_score( $bootstrap ) if defined $bootstrap and looks_like_number $bootstrap;
513            
514             # copy other tags
515 0           for my $tag ( $bpnode->get_all_tags ) {
516 0           my @values = $bpnode->get_tag_values( $tag );
517 0           $node->set_generic( $tag => \@values );
518             }
519 0           return $node;
520             }
521            
522              
523             =head2 create_bphylo_aln
524              
525             Title : create_bphylo_aln
526             Usage : my $bphylo_aln = $factory->create_bphylo_aln($bperl_aln);
527             Function: Converts a L object into Bio::Phylo::Matrices::Matrix object
528             Returns : a Bio::Phylo::Matrices::Matrix object
529             Args : Bio::SimpleAlign object
530              
531             =cut
532              
533             sub create_bphylo_aln {
534            
535 0     0 1   my ($self, $aln, $taxa, @args) = @_;
536            
537             #most of the code below ripped from Bio::Phylo::Matrices::Matrix::new_from_bioperl()
538 0 0         if ( $aln->isa('Bio::Align::AlignI') ) {
539 0           $aln->unmatch;
540 0           $aln->map_chars('\.','-');
541 0           my @seqs = $aln->each_seq;
542 0           my ( $type, $missing, $gap, $matchchar );
543 0 0         if ( $seqs[0] ) {
544 0   0       $type = $seqs[0]->alphabet || $seqs[0]->_guess_alphabet || 'dna';
545             }
546             else {
547 0           $type = 'dna';
548             }
549            
550 0   0       my $matrix = $fac->create_matrix(
      0        
      0        
551             '-type' => $type,
552             '-special_symbols' => {
553             '-missing' => $aln->missing_char || '?',
554             '-matchchar' => $aln->match_char || '.',
555             '-gap' => $aln->gap_char || '-',
556             },
557             @args
558             );
559             # XXX create raw getter/setter pairs for annotation, accession, consensus_meta source
560 0           for my $field ( qw(description accession id annotation consensus_meta score source) ) {
561 0           $matrix->$field( $aln->$field );
562             }
563 0           my $to = $matrix->get_type_object;
564 0           my @feats = $aln->get_all_SeqFeatures();
565            
566 0           for my $seq ( @seqs ) {
567             #create datum linked to taxa
568 0           my $datum = create_bphylo_datum($seq, $taxa, \@feats, '-type_object' => $to);
569 0           $matrix->insert($datum);
570             }
571 0           return $matrix;
572             }
573             else {
574 0           $self->throw('Not a bioperl alignment!');
575             }
576             }
577              
578              
579              
580             =head2 create_bphylo_seq
581              
582             Title : create_bphylo_seq
583             Usage : my $bphylo_seq = $factory->create_bphylo_seq($bperl_seq);
584             Function: Converts a L object into Bio::Phylo::Matrices::Matrix object
585             Returns : a Bio::Phylo::Matrices::Matrix object
586             Args : Bio::Seq object
587              
588             =cut
589              
590             sub create_bphylo_seq {
591 0     0 1   my ($self, $seq, $taxa, @args) = @_;
592 0   0       my $type = $seq->alphabet || $seq->_guess_alphabet || 'dna';
593 0           $type = uc($type);
594            
595 0           my $dat = create_bphylo_datum($seq, $taxa, '-type' => $type);
596            
597             # copy seq string
598 0           my $seqstring = $seq->seq;
599 0 0 0       if ( $seqstring and $seqstring =~ /\S/ ) {
600 0           eval { $dat->set_char( $seqstring ) };
  0            
601 0 0 0       if ( $@ and UNIVERSAL::isa($@,'Bio::Phylo::Util::Exceptions::InvalidData') ) {
602 0           $self->throw("\n\nThe BioPerl sequence object contains invalid data ($seqstring)\n");
603             }
604             }
605            
606             # copy name
607 0           my $name = $seq->display_id;
608             #$dat->set_name( $name ) if defined $name;
609            
610             # copy desc
611 0           my $desc = $seq->desc;
612 0 0         $dat->set_desc( $desc ) if defined $desc;
613            
614             #get features from SeqFeatureI
615 0           for my $field ( qw(start end strand) ) {
616 0 0         $dat->$field( $seq->$field ) if $seq->can($field);
617             }
618 0           return $dat;
619             }
620              
621             =head2 create_bphylo_taxa
622              
623             Title : create_bphylo_seq
624             Usage : my $taxa = $factory->create_bphylo_taxa($bperl_obj);
625             Function: creates a taxa object from the data attached to a bioperl object
626             Returns : a Bio::Phylo::Taxa object
627             Args : L object, or L object, or L object
628              
629             =cut
630              
631             sub create_bphylo_taxa {
632 0     0 1   my $self = shift @_;
633 0           my ($obj) = @_;
634            
635             #check if tree or aln object
636 0 0 0       if ( UNIVERSAL::isa( $obj, 'Bio::Align::AlignI' ) || UNIVERSAL::isa( $obj, 'Bio::Seq')) {
    0          
637 0           return $self->_create_bphylo_matrix_taxa(@_);
638             }
639             elsif ( UNIVERSAL::isa( $obj, 'Bio::Tree::TreeI' ) ) {
640 0           return $self->_create_bphylo_tree_taxa(@_);
641             }
642             }
643              
644             sub _create_bphylo_tree_taxa {
645 0     0     my ($self, $tree) = @_;
646            
647 0           my $taxa = $fac->create_taxa();
648 0           my $taxon;
649            
650             #check if taxa exists
651 0 0         unless ($tree->has_tag('taxa_id')) {
652 0           return 0;
653             }
654            
655             #copy taxa details
656 0           $taxa->set_xml_id(($tree->get_tag_values('taxa_id'))[0]);
657 0           $taxa->set_name(($tree->get_tag_values('taxa_label'))[0]);
658            
659 0           foreach my $taxon_name ($tree->get_tag_values('taxon')) {
660            
661 0           $taxon = $fac->create_taxon(-name => $taxon_name);
662 0           $taxa->insert($taxon);
663             }
664 0           return $taxa;
665             }
666              
667             sub _create_bphylo_matrix_taxa {
668 0     0     my ($self, $aln) = @_;
669            
670 0           my $taxa = $fac->create_taxa();
671 0           my $taxon;
672 0           my @feats = $aln->get_all_SeqFeatures();
673            
674 0           foreach my $feat (@feats) {
675 0 0         if (my $taxa_id = ($feat->get_tag_values('taxa_id'))[0]) {
676 0           my $taxa_label = ($feat->get_tag_values('taxa_label'))[0];
677            
678 0 0         $taxa->set_name($taxa_label) if defined $taxa_label;
679 0 0         $taxa->set_xml_id($taxa_id) if defined $taxa_label;
680 0           my @taxa_bp = $feat->get_tag_values('taxon');
681 0           foreach my $taxon_name (@taxa_bp) {
682 0           $taxon = $fac->create_taxon(-name => $taxon_name);
683 0           $taxa->insert($taxon);
684             }
685 0           last;
686             }
687             }
688 0           return $taxa
689             }
690              
691             =head2 create_bphylo_datum
692              
693             Title : create_bphylo_datum
694             Usage : my $bphylo_datum = $factory->create_bphylo_datum($bperl_datum);
695             Function: Converts a L object into Bio::Phylo::Matrices::datum object
696             Returns : a Bio::Phylo::Matrices::datum object
697             Args : Bio::Seq object, Bio::Phylo::Taxa object,
698             [optional] arrayref to SeqFeatures,
699             [optional] key => value pairs to pass to Bio::Phylo constructor
700              
701             =cut
702              
703             sub create_bphylo_datum {
704             #mostly ripped from Bio::Phylo::Matrices::Datum::new_from_bioperl()
705 0     0 1   my ( $seq, $taxa, @args ) = @_;
706 0           my $class = 'Bio::Phylo::Matrices::Datum';
707 0           my $feats;
708             # want $seq type-check here? Allowable: is-a Bio::PrimarySeq,
709             # Bio::LocatableSeq /maj
710 0 0         if (@args % 2) { # odd
711 0           $feats = shift @args;
712 0 0         unless (ref($feats) eq 'ARRAY') {
713 0           Bio::Root::Root->throw("Third argument must be array of SeqFeatures");
714             }
715             }
716 0   0       my $type = $seq->alphabet || $seq->_guess_alphabet || 'dna';
717 0           my $self = $class->new( '-type' => $type, @args );
718             # copy seq string
719 0           my $seqstring = $seq->seq;
720 0 0 0       if ( $seqstring and $seqstring =~ /\S/ ) {
721 0           eval { $self->set_char( $seqstring ) };
  0            
722 0 0 0       if ( $@ and UNIVERSAL::isa($@,'Bio::Phylo::Util::Exceptions::InvalidData') ) {
723 0           $self->throw("\n\nThe BioPerl sequence object contains invalid data ($seqstring)\n");
724             }
725             }
726            
727             # copy name
728 0           my $name = $seq->display_id;
729 0 0         $self->set_name( $name ) if defined $name;
730 0           my $taxon;
731 0 0         my @feats = (defined $feats ? @$feats : $seq->get_all_SeqFeatures);
732             # convert taxa
733 0           foreach my $feat (@feats)
734             {
735             #get sequence id associated with taxa to compare
736 0 0         my $taxa_id = ($feat->get_tag_values('id'))[0] if $feat->has_tag('id');
737 0 0 0       if ($taxa_id && $name eq $taxa_id)
738             {
739 0           my $taxon_name;
740 0 0         if($feat->has_tag('my_taxon')) {
741 0           $taxon_name = ($feat->get_tag_values('my_taxon'))[0]
742             }
743             else {
744 0           $taxon_name = ($feat->get_tag_values('taxon'))[0];
745             }
746 0           $self->set_taxon($taxa->get_by_name($taxon_name));
747             }
748             }
749            
750             # copy desc
751 0           my $desc = $seq->desc;
752 0 0         $self->set_desc( $desc ) if defined $desc;
753              
754             # only Bio::LocatableSeq objs have these fields...
755 0           for my $field ( qw(start end strand) ) {
756 0 0         $self->$field( $seq->$field ) if $seq->can($field);
757             }
758 0           return $self;
759             }
760              
761             =head2 CREATOR
762              
763             =cut
764              
765             =head1 bioperl_create
766              
767             Title : bioperl_create
768             Usage : $bioperl_obj = $fac->bioperl_create($obj_type, $biophylo_proj);
769             Function: Create a specified bioperl object using a Bio::Phylo project
770             Args : scalar string ('aln', 'tree', 'seq') type designator
771             Bio::Phylo::Project object
772             Returns : Appropriate BioPerl object
773              
774             =cut
775              
776             sub bioperl_create {
777 0     0 0   my $self = shift;
778 0           my ($type, @args) = @_;
779 0 0         unless (grep /^type/,qw( seq aln tree )) {
780 0           $self->throw("Unrecognized type for argument 1");
781             }
782 0           my $call = 'create_bioperl_'.$type;
783 0           return $self->$call(@args);
784             }
785              
786             1;
787