import os.path, subprocess
from Bio import Phylo, AlignIO
from Bio.Align import MultipleSeqAlignment
def build_msa(node, sequence_msa_map):
    """Write the alignment rows for all leaves under *node* to a file.

    The output file is named after the hash of *node* with a ``.msa``
    suffix, is created in the current working directory and is written
    in Stockholm format.

    Args:
        node: Tree node providing ``get_terminals()``; each returned leaf
            must expose a ``name`` attribute.
        sequence_msa_map: Mapping from leaf name to the alignment record
            for that leaf.

    Returns:
        The name of the file that was written.

    Raises:
        KeyError: If a leaf name has no entry in *sequence_msa_map*.
    """
    file_name = str(hash(node)) + '.msa'
    # Leaf names double as record ids, so each leaf's name is the lookup key.
    records = [sequence_msa_map[terminal.name]
               for terminal in node.get_terminals()]
    alignment = MultipleSeqAlignment(records)
    # Open the file only once the records are known to exist, and let the
    # context manager close (and flush) it even if writing fails.
    with open(file_name, 'w') as file_handle:
        AlignIO.write(alignment, file_handle, 'stockholm')
    return file_name
def build_hmm(msa_file_name):
    """Run ``hmmbuild`` on an alignment file and return the HMM file name.

    The HMM file name is *msa_file_name* with its extension replaced by
    ``.hmm``. The call blocks until ``hmmbuild`` has finished, so the
    command has completed successfully by the time this function returns.

    Args:
        msa_file_name: Path of the alignment file passed to ``hmmbuild``.

    Returns:
        The path handed to ``hmmbuild`` as its output HMM file.

    Raises:
        OSError: If the ``hmmbuild`` executable cannot be started.
        subprocess.CalledProcessError: If ``hmmbuild`` exits with a
            non-zero status.
    """
    file_prefix = os.path.splitext(msa_file_name)[0]
    hmm_file_name = file_prefix + '.hmm'
    # An argument list (no shell) keeps paths containing spaces or shell
    # metacharacters intact; check_call waits for completion and surfaces
    # failures instead of leaving an unreaped background process.
    subprocess.check_call(['hmmbuild', hmm_file_name, msa_file_name])
    return hmm_file_name
def treewalker(root, sequence_msa_map):
    """Build an alignment file and an HMM for *root* and every descendant.

    The node itself is processed first, then each entry of ``root.clades``
    is visited recursively.

    Args:
        root: Tree node to start from; must be accepted by ``build_msa``
            and expose a ``clades`` iterable of child nodes.
        sequence_msa_map: Mapping from leaf name to alignment record,
            passed through unchanged to ``build_msa``.
    """
    msa_file_name = build_msa(root, sequence_msa_map)
    build_hmm(msa_file_name)
    # Descend into every child; a node without children simply has nothing
    # to iterate, which ends the recursion.
    for clade in root.clades:
        treewalker(clade, sequence_msa_map)
def main():
    """Read the tree and alignment, then build an MSA/HMM pair per node.

    The alignment records are indexed by their ``id`` and the tree is
    walked from its root with ``treewalker``.
    """
    # NOTE(review): the tree path is empty in this source; set it to the
    # Newick tree file before running, otherwise reading the tree fails.
    tree_file = ""
    msa_file = "sample_alignment.msa"
    # Not used by any code visible here.
    new_sequence_file = "new_sequence.fasta"
    # Note: the name of the tree leaf nodes is going to be the
    # same as the id of each msa entry
    tree = Phylo.read(tree_file, "newick")
    msa = AlignIO.read(msa_file, "fasta")
    sequence_msa_map = {entry.id: entry for entry in msa}
    treewalker(tree.root, sequence_msa_map)
if __name__ == '__main__':