aakash0017's picture
Upload folder using huggingface_hub
b7731cd
# Copyright (C) 2009 by Eric Talevich ([email protected])
#
# This file is part of the Biopython distribution and governed by your
# choice of the "Biopython License Agreement" or the "BSD 3-Clause License".
# Please see the LICENSE file that should have been included as part of this
# package.
"""I/O function wrappers for ``Bio.Nexus`` trees."""
from itertools import chain
from Bio.Nexus import Nexus
from Bio.Phylo import Newick, NewickIO
# Structure of a Nexus tree-only file
NEX_TEMPLATE = """\
#NEXUS
Begin Taxa;
Dimensions NTax=%(count)d;
TaxLabels %(labels)s;
End;
Begin Trees;
%(trees)s
End;
"""
# 'index' starts from 1; 'tree' is the Newick tree string
TREE_TEMPLATE = "Tree tree%(index)d=%(tree)s"
def parse(handle):
"""Parse the trees in a Nexus file.
Uses the old Nexus.Trees parser to extract the trees, converts them back to
plain Newick trees, and feeds those strings through the new Newick parser.
This way we don't have to modify the Nexus module yet. (Perhaps we'll
eventually change Nexus to use the new NewickIO parser directly.)
"""
nex = Nexus.Nexus(handle)
# NB: Once Nexus.Trees is modified to use Tree.Newick objects, do this:
# return iter(nex.trees)
# Until then, convert the Nexus.Trees.Tree object hierarchy:
def node2clade(nxtree, node):
subclades = [node2clade(nxtree, nxtree.node(n)) for n in node.succ]
return Newick.Clade(
branch_length=node.data.branchlength,
name=node.data.taxon,
clades=subclades,
confidence=node.data.support,
comment=node.data.comment,
)
for nxtree in nex.trees:
newroot = node2clade(nxtree, nxtree.node(nxtree.root))
yield Newick.Tree(
root=newroot, rooted=nxtree.rooted, name=nxtree.name, weight=nxtree.weight
)
def write(obj, handle, **kwargs):
"""Write a new Nexus file containing the given trees.
Uses a simple Nexus template and the NewickIO writer to serialize just the
trees and minimal supporting info needed for a valid Nexus file.
"""
trees = list(obj)
writer = NewickIO.Writer(trees)
nexus_trees = [
TREE_TEMPLATE % {"index": idx + 1, "tree": nwk}
for idx, nwk in enumerate(
writer.to_strings(plain=False, plain_newick=True, **kwargs)
)
]
tax_labels = [str(x.name) for x in chain(*(t.get_terminals() for t in trees))]
text = NEX_TEMPLATE % {
"count": len(tax_labels),
"labels": " ".join(tax_labels),
"trees": "\n".join(nexus_trees),
}
handle.write(text)
return len(nexus_trees)