# Verify Presence of Established Primer Pairs in a Dataset

Given the `nt` data set, which consists of short sequences from well-examined regions such as CO1 and the ribosomal subunits, we wish to verify whether established primer pairs for these regions are found by PriSeT.


In [None]:
import collections

# Record describing one established primer pair.
#
# Fields:
#   name:           short string ID
#   name_fwd:       dedicated string ID for forward primer
#   name_rev:       dedicated string ID for reverse primer
#   seq_fwd:        one-letter encoded DNA sequence of forward primer
#   seq_rev:        one-letter encoded DNA sequence of reverse primer
#   target_region:  genome location for which primer was originally designed
#   target_group:   organism group for which primer was originally designed
#   product_length: expected amplicon length (without primer sequences)
#   ref_pub:        original publication referring to this primer pair
#
# A field is None when no value is given for that primer pair.
primer_pair = collections.namedtuple(
    'primer_pair',
    [
        'name',
        'name_fwd',
        'name_rev',
        'seq_fwd',
        'seq_rev',
        'target_region',
        'target_group',
        'product_length',
        'ref_pub',
    ],
)

# Established primer pairs to look for. Built as a single list literal;
# Python lists have no push_back(), and missing values are None (not NULL).
primer_pairs = [
    primer_pair(
        "DIV4", "DIV4_fw", "DIV4_rv",
        "GCGGTAATTCCAGCTCCAATAG", "CTCTGACAATGGAATACGAATA",
        None, "Diatoms", 329,
        "https://www.ncbi.nlm.nih.gov/pubmed/26052741",
    ),
    primer_pair(
        "EUK14", "F-566cw-bio", "R-1200",
        "CAGCAGCCGCGGTAATTCC", "CCCGTGTTGAGTCAAATTAAGC",
        "18S", "Eukaryotes", None,
        None,
    ),
    primer_pair(
        "EUK15", "TAReuk454FWD1", "TAReukREV3",
        "CCAGCASCYGCGGTAATTCC", "ACTTTCGTTCTTGATYRA",
        "18S", "Eukaryotes", None,
        "http://www.biomarks.eu/sites/default/files/pdf-refs/Stoeck%20et%20al%202010.pdf",
    ),
    primer_pair(
        "UNIV", "926mod", "1392mod",
        "AAACTYRAAGWGRCGG", "AAAGTCTCGTGWGTRC",
        "16S", "Universal", None,
        None,
    ),
    primer_pair(
        "23S", "A23SrVF1", "A23SrVR1",
        "GGACARAAAGACCCTATG", "AGATCAGCCTGTTATCC",
        None, None, 400,
        "https://peerj.com/articles/2115/",
    ),
    # NOTE(review): target_region is "23S" for the COI pair while the "23S"
    # pair above has none -- possibly a mix-up; confirm against the sources.
    primer_pair(
        "COI", "LCO1490", "COI_230_R",
        "GGTCAACAAATCATAAAGATATTGG", "CTTATRTTRTTTATICGIGGRAAIGC",
        "23S", None, 230,
        "https://pdfs.semanticscholar.org/943d/38b9d96f8222e883604822bcafb7930ca6da.pdf",
    ),
    primer_pair(
        "nSSU", "SU_FO4 nSSU", "SSU_R22 nSSU",
        "GCTTGTCTCAAAGATTAAGCC", "GCCTGCTGCCTTCCTTGGA",
        "18S", "multiple metazoan phyla", None,
        "https://www.nature.com/articles/ncomms1095",
    ),
    primer_pair(
        "V9", "V9_18S_fw", "V9_18S_rv",
        "GTACACACCGCCCGTC", "TGATCCTTCTGCAGGTTCACCTAC",
        "18S", "zooplankton", None,
        None,
    ),
]

# Lookup keyed by one-letter codes that occur in the primer sequences above.
# All values are empty strings here -- presumably placeholders to be filled
# in later; TODO confirm intended contents (the sequences also use S and W,
# which have no entry).
one_letter_codes = {'R': '', 'I': '', 'Y': ''}