# This script runs a BLAST search and saves the data within an XML document

In [13]:
# Load the query protein sequence from a FASTA file.
# The example query is TEM-1 beta-lactamase.
from Bio import SeqIO

protein_seq = SeqIO.read("Documents/TEM-1.fasta", format="fasta")

In [14]:
# Sanity check: display the sequence that was just parsed. This is a bare
# expression, so the notebook echoes its value as the cell output.
protein_seq.seq

Seq('HPETLVKVKDAEDQLGARVGYIELDLNSGKILESFRPEERFPMMSTFKVLLCGA...KHW')

In [15]:
# Submit the query to NCBI's online BLAST service: a homologous-protein
# search (blastp) against the non-redundant protein database ("nr").
# Many more qblast parameters are described at:
# https://biopython.org/docs/1.75/api/Bio.Blast.NCBIWWW.html

# This example uses an E-value of 0.0001 and returns the 10 best hits.
from Bio.Blast import NCBIWWW

result_handle = NCBIWWW.qblast(
    program="blastp",
    database="nr",
    sequence=protein_seq.seq,
    expect=0.0001,
    hitlist_size=10,
)

In [16]:
# Save the NCBI search results as an XML document.
# The results handle is closed in `finally` so it is released even when
# opening or writing the output file fails.
try:
    # Write as UTF-8 explicitly instead of relying on the platform's default
    # text encoding, so the saved XML is identical on every OS.
    with open("Documents/TEM-database.xml", "w", encoding="utf-8") as save_to:
        save_to.write(result_handle.read())
finally:
    result_handle.close()