### Download the 4 ribosomal RNA (rRNA) sequences from NCBI

 * 28S - NR_003287.2
 * 18S - NR_003286.2
 * 5.8S - NR_003285.2
 * 5S - NR_023363.1

#### Globals

In [7]:
from Bio import Entrez
from Bio import SeqIO

# contact address configured on Biopython's Entrez module for the NCBI queries below
Entrez.email = 'rasi1983@gmail.com'

# rRNA name -> RefSeq accession (including version suffix) to download
refseqids = dict([
    ('28S', 'NR_003287.2'),
    ('18S', 'NR_003286.2'),
    ('5.8S', 'NR_003285.2'),
    ('5S', 'NR_023363.1'),
])

#### Fetch rRNA sequences from NCBI and write them to a FASTA file

In [12]:
# Look up every accession in `refseqids` at NCBI, download its FASTA record,
# strip the header down to the bare accession, and write all records to a
# single FASTA file.
outputlist = []
for (name, ID) in refseqids.items():
    # identify ids by searching for the accession
    handle = Entrez.esearch(db="nucleotide", term=ID)
    try:
        rec = Entrez.read(handle)
    finally:
        # release the connection even if parsing the search result fails
        handle.close()
    if not rec["IdList"]:
        # fail with a message naming the missing entry instead of a bare
        # IndexError from indexing an empty hit list
        raise ValueError(
            "No nucleotide record found for %s rRNA (%s)" % (name, ID))
    # retrieve full record for the first found id
    handle = Entrez.efetch(db="nucleotide", id=rec["IdList"][0],
                           rettype="fasta", retmode="text")
    try:
        output = SeqIO.read(handle, 'fasta')
    finally:
        handle.close()
    # clean up record to be minimalistic: the FASTA header becomes just the
    # accession
    output.id = ID
    output.description = output.name = ''
    outputlist.append(output)

SeqIO.write(outputlist, '../data/reference_sequences/hg38.rrna.fasta', 'fasta')