# Translating RNA into Protein

The 20 commonly occurring amino acids are abbreviated by using 20 letters from the English alphabet (all letters except for B, J, O, U, X, and Z).

UUU F      CUU L      AUU I      GUU V
UUC F      CUC L      AUC I      GUC V
UUA L      CUA L      AUA I      GUA V
UUG L      CUG L      AUG M      GUG V
UCU S      CCU P      ACU T      GCU A
UCC S      CCC P      ACC T      GCC A
UCA S      CCA P      ACA T      GCA A
UCG S      CCG P      ACG T      GCG A
UAU Y      CAU H      AAU N      GAU D
UAC Y      CAC H      AAC N      GAC D
UAA Stop   CAA Q      AAA K      GAA E
UAG Stop   CAG Q      AAG K      GAG E
UGU C      CGU R      AGU S      GGU G
UGC C      CGC R      AGC S      GGC G
UGA Stop   CGA R      AGA R      GGA G
UGG W      CGG R      AGG R      GGG G 

In [1]:
rna_codon_table = {
    'A': ['GCU', 'GCC', 'GCA', 'GCG'],
    'C': ['UGU', 'UGC'],
    'D': ['GAU', 'GAC'],
    'E': ['GAA', 'GAG'],
    'F': ['UUU', 'UUC'],
    'G': ['GGU', 'GGC', 'GGA', 'GGG'],
    'H': ['CAU', 'CAC'],
    'I': ['AUU', 'AUC', 'AUA'],
    'K': ['AAA', 'AAG'],
    'L': ['CUU', 'CUC', 'CUA', 'CUG', 'UUA', 'UUG'],
    'M': ['AUG'],
    'N': ['AAU', 'AAC'],
    'P': ['CCU', 'CCC', 'CCA', 'CCG'],
    'Q': ['CAA', 'CAG'],
    'R': ['CGU', 'CGC', 'CGA', 'CGG', 'AGA', 'AGG'],
    'S': ['UCU', 'UCC', 'UCA', 'UCG', 'AGU', 'AGC'],
    'T': ['ACU', 'ACC', 'ACA', 'ACG'],
    'V': ['GUU', 'GUC', 'GUA', 'GUG'],
    'W': ['UGG'],
    'Y': ['UAU', 'UAC'],
    'STOP': ['UAA', 'UAG', 'UGA']
}

In [2]:
codons = open("codons.txt", "r").read().split("\n")
rna_codon_list = {i.split(" ")[0]:i.split(" ")[1] for i in codons}
rna_codon_list

{'UUU': 'F',
 'CUU': 'L',
 'AUU': 'I',
 'GUU': 'V',
 'UUC': 'F',
 'CUC': 'L',
 'AUC': 'I',
 'GUC': 'V',
 'UUA': 'L',
 'CUA': 'L',
 'AUA': 'I',
 'GUA': 'V',
 'UUG': 'L',
 'CUG': 'L',
 'AUG': 'M',
 'GUG': 'V',
 'UCU': 'S',
 'CCU': 'P',
 'ACU': 'T',
 'GCU': 'A',
 'UCC': 'S',
 'CCC': 'P',
 'ACC': 'T',
 'GCC': 'A',
 'UCA': 'S',
 'CCA': 'P',
 'ACA': 'T',
 'GCA': 'A',
 'UCG': 'S',
 'CCG': 'P',
 'ACG': 'T',
 'GCG': 'A',
 'UAU': 'Y',
 'CAU': 'H',
 'AAU': 'N',
 'GAU': 'D',
 'UAC': 'Y',
 'CAC': 'H',
 'AAC': 'N',
 'GAC': 'D',
 'UAA': 'Stop',
 'CAA': 'Q',
 'AAA': 'K',
 'GAA': 'E',
 'UAG': 'Stop',
 'CAG': 'Q',
 'AAG': 'K',
 'GAG': 'E',
 'UGU': 'C',
 'CGU': 'R',
 'AGU': 'S',
 'GGU': 'G',
 'UGC': 'C',
 'CGC': 'R',
 'AGC': 'S',
 'GGC': 'G',
 'UGA': 'Stop',
 'CGA': 'R',
 'AGA': 'R',
 'GGA': 'G',
 'UGG': 'W',
 'CGG': 'R',
 'AGG': 'R',
 'GGG': 'G'}

In [76]:
sample = "AUGGCCAUGGCGCCCAGAACUGAGAUCAAUAGUACCCGUAUUAACGGGUGA"

In [88]:
def trans_prot(sample):
    codon_list = [sample[i*3-3:i*3] for i in range(1, int(len(sample)/3)+1)]
    return "".join([rna_codon_list[i] for i in codon_list if rna_codon_list[i] != "Stop"])

In [89]:
trans_prot(sample)

'MAMAPRTEINSTRING'

In [90]:
test = "AUGCUGCCUAUGUCUGCAAAAUUUGUGAAUCUGUCAAGCGACACUCUGGCGCCUGUUACCCUCAUGCCGCGUUGGGCUGCAGCAACACAAUCCGUGAUCAAGCGCAGCCCUGUUAGGUACACCGGCAUAUUACUACCAGGUCCGUUUUACGACACGAACGGCUUCGUGCGUAGUCGACGCGCCUCAGUGGACAGAGGAAUUGGUACCUUUUCGCCCUUUGGUGACCUUUACCACCAAUGCGUUGGUACCGAAUUCAAUGUUUGCCAAAGGUUUGAGCAAGGAGGAUCUCUAGAUCCACACAACCCUUUGAAUUUAUUCACAGACCAGAAUAUUCGCAGGAUUACACACCUGCGAUCAUGUCUCUACGAGUCCGAUAUUAGGGAACUGUACUUCAGAUCUUAUAACGUAGACAAGAAUAUUGCUACAAAAGUCCGUGGGGGAGGUAUACCAGAGAUACUCUAUAGACUCCCGUCAGGCAGACGAUUGUUUGGCGAGGUGCGUAAUUUCCACCAGCCAUUAAGCCCCCUUGCUAUGACAUUGAGGAAUACCUCGGCCCCAGUUAGUGCAAUUCAUCAAGAGCGCGACGUGUUUGACACCGAAAUCUCCGCGCUUCACUCCGCCAAACGUGUGGGCGUUUAUAUGUUCGUCCAUUAUCACCAGUUUGUCGUCACCCCGACUACGAACACAACGAGUGCUUGGCCGGGAGAAAACCUUAAAGGAAUUCAGGUGUAUAUUCCUGACUUAAACAGCCCGUUCUUAGUAUUCUAUUUCAUUCUUCUUGAUCUAGUCGUCAAGUCGAGCAGUUCCAAGCAGCCCAGUGGUGGAACCGCGUAUAGAGUCACAAAACACACACAGGGAAUGAAGCACACUGGUUCUUCGGCUUGCAGGAUCCGUAUCGCCCUGCCCAGCUUUAAUCGAUAUAUUUUCGAUCUGAUUCAAGGGAACCAUGCUCGCGCGCAGCAUUCGACGGUGGAUCGGAUGGGGUCAGAUUGUUCCCCACCAUACGCUACUCAUAUGACGACUUGCGGUAUACCACCAGAGACGGGGCUGCGGCUCAGCGCCCCAAAAGAAAACAACCGUCUUUUAGCUCCAGACCCCCGUUUAACACAAAAACGCGUGGGUGAUAAGUACACCAGCAAAGCUACAGUAUUCGCCGCACGCCUAUCGACUUUUAGCCCUAUAAUCAAAAUGAUGCACCUUAUUAGAUUGAAGCAGCUUUCUGCCGAGCGACAGUGCACCUUAUCAAGUCCCGUCGGGGUGCUUUGCUUACUGCACCGUGAUCUCAGUCGGAAAGCUAGUGUCGCGAGCUAUCGUUGCUGCCCACCCGACGUUCAACCAUUGAAACGUUCAAAAACGACGUGCGAACGUACAUCCGUUCUCGGACGCAAGACAGGAAGAGGCGAAGAGGGUUACUAUCACAUUGAACUAGCGAGUCGCUGCUCUCCGACCAACGCGCCUGUAGGGGACGGAGAAUGCGCGCCAAGACAAUUCCGGGUAGCCUCACGGGCGACGGUGCCGUCACUUAGACGCCUUGUAGACAUCCCGGGGAACGUGAAUUGUUUGGAUAAUUUUCAGUCGGGGGCACUCUAUGCCAAGAAACGCGUUGUAGGUCCUGAAAGGACAUUUCGUCGCACAGACAAAUUUACAUCCUUACCCAUUUACGGGAUCCAGUUGGAGUUCGAAACUCAAGUCCCGGGCAUAUUUUGUUUUGUUCUCGGUCUGAAGGCCAGUGUCCUGAGACGUGUGCUUUCCUACGCUGAAAAGCUCUCGCUGUCAGGGCGAUCAGUGAGAUGUGCGCGGGUAACAGGAUGUAUAUGGCUGCUCCGAACGGCUUGUUGUACCCGAUCGCUCCAUGCUCAUGGCAGACAUAGUGUGUUAAUAAACUACGCAAUUCACCACUUCUACUUCUUACCCUUUCCCAUCCGAGGAAACGCAAGUCAGCUCGAGUCUGGGCUCCAUUGUAAGACGAGCGUUAUUCAAAACUUGCCCCCUGUGAGUAUGCUGUCACAUAGUGUGGUCGUCCCUACGUAUGGAUAUGUAUCUUUCGCACAUCCUAAAGUCCCGGACCGUAAACCUAAUAUAACCGCUUCUAGUGGUUAUUCUUUUUGGCAGAUCGUUUUAUACGUUGAGCGUCGAUCCGAAGGGCUUGAGCGUCGCACAUGCCUAGCAGAUGAAAACCUCGCUCCAUGGCCUCGUACAUCAUCAGCUCAAUCGACGGCGGGGACCAUACAGGUACAAUUAUUACCGGCUGAAUUCAUAGGGGGUGGAUUGCUUUAUAUCAGGGAAAAGUCUCUGCUGUCCAGGGAGCGCCCGUCUGCUCCAGAACUACCCCGGGCGCGGUCUCUGUGCAAACAUACUACUGGUGCAUGUUUGAACGGACGCAGAAGUGAAUUACACGUAGUAGAUGCAAGUCACCCGGGGAGCUACCGGCAAGGGUAUUCCGUUCAGAUGAAUGAAAAAUCUGCAGCUGAGCUCAUUAGACAUCUCUACCCCCACGACAGGCAGAUAUCUGUUUUCCCGUGCCCGACUGGGACUUCUACAGGUGUCCGUAAGCUGUGUCAGGCUGCCGUGUCAGAUGUAAGCGUCGGGGACAUUGCCAACUUACAAACGGGGCUCCGACCUUACUCAUGUGUAGCAUUUAAACCAUGUUUAACUCGUCCAAAGACAUUCAAAACCUGGCCCGUCACUCUGGCGAAAUGCACCCGUUUAGAUGCGCGGUUCGCUGGUUUGGUCACGACAAUAGUAGGUCAAAGCUACGGUGAAUUUAUUUUCAUCGGAGAAACGCAAUGCUUAUCUAGAACUAAUAAAUAUCAAAAUUUCAUCAAGAUGCGAGGGGACAUUAAGCCCCUUAGGCUAUUUUGGACCCCAAUCGCCUGGGUAGCCAUUCCGAACCGGGACCGCAUUUAUUCCAAUGCAAAUCUCGUUUGGGUUGGUGGGCGCUCCAGCCCCGUAAGUUUCAUCCCGUGUCAGGGUUGUUCAGGCCUUGCGUGCCCAGCAUUUCAUUCCAGGGAUAAGCGGGUACACGACGAGGCGUGGCGGCUAGUGGACCAUCUCCAUAGCUUAGAGCUAGGGGCUCCCUAUCGAAUAUGGGUGCGUAUAUUUGGACGGUGUGGUUAUGGCCGUAUGUGCGAGCUAGAGACGGUGAAGGUUUCGGAAAACGCCACCAUGUGGCCGAGGCACGGGGUCUGUCCCCAGCAAGGGAAAUUAGCGCUAUCUAGAGCCGCGUCAAGGAACUUAGCGCGGGGGAUAAAGCACGUUCAGAUGGUCAGGACUUACCAAACGGUGAGUGUGGCGCCGUCACUCUCCUUUAAUGCCGUAGGCGACGCCAAACUGCGAUCUGGGGCGGUUCCUCAAACACUCGUGUAUUUCCGAGGUAAAUGUCCAAAUGAUACCGGAUGGUCUUCGUUAAUUCAUCCUGGUCGGGAUUUCCUUGUGGGCAGGACGCAUCCGUCGCAGGCCAUUAUCGUAAUACCUACGAUGUUCGGAUUAGAAUUUGGUACUACUGAAACCUCCCCGCCUAUCACGGAUAGGCUAGCUCUCACUAUCCCGGAGAGUGGGGUGGUCGUGGAAAGGCGAGAGUCUAAUCUAUGCGGAAAAACGGCUACAGUAGUGCGGUCGUAUAGACAUAGCUCACAAAUUGAUCCCAUUUGGCCACCACAGAGCCUGGAACAAUACGCUGGUGCCGGUUAUGAAGGUCCAGUCCGAGGGAAGUACCGCACAACGCGAAAGAAGACUGCUUUCGCUUGUGCUUUGGGGAAGUACGCGCAUCUACAUAGCAAUUCCACAUGCCUAUCUGGCCAUAAUCGCCGUGGCUGCACUGUGCUGCGGGAAGAGUCCCCUUGUUACGGACUUAAAUCACCCUACUCCGAUCUGGACACUUUUCAAUGGGCUAAUCUUAUCUCUCGUGCGCUUGUGGGGGCCGUACAUAAGACGUUCUGCGUUGCAGGAUACGACAUUUAUGACACCCAAGUACGGAAAACGCGACUAAAAAGCUACCUGGGCGGCCCAAAUAACUCGCCGCGAAGCAACCGCGAGCGACUGCACCACUCGGAAAGAUUUUGGCGAUGUCCAAAUUCUGUAUCCCGCCUAGCCUGUUCCUGCUCUCGCCAGGCCUCGGUGGAAAAGAUCCCAUUGGGUUACAGAACGACAUUCCCAAUAUUAUCCUCAGGUGUCAAUCAUUUUGAGGGAUCGGCGUAUGAGUUCUGGCGAAAACACGUCGAGGAAUUGGGUCAAGGCGGGCGGACACUGAGGUCCCAUGAGCUAGCAGAUCUACCCUUUGACUGUGCACGGAGGGCAAUUAGUGACAAUUUGCUGAGGACUUUAGGGUUUCAGGAAUGGAACUCCAUAAGUGCACCUCUAUAUGUAUGUGGUUACACCAGGUUACUUCACUGUUGGAGAGCACUUCGUAAUGGGCGGACCGACUGCUUUCAUUAUAGCUUGCGCUUCUUAUCACAGAUAAACACCACUAUCAGCUCUAACCACUUGCAUCGGCCGCGAGUAAGGCCUCAGCGAACAAAAACGUGCUAUCUUCACGGAGGACCUGGCCGGCUUAGCCCGAGGCGUAGUUGCUCUAGCACUCCCAUUCCGUCCGAAGGAUGUACUGCUAAGCUUCUCGAUAAAGCGGCGGACGGGGCGAGACUUGCACGUACCUACGGGAUUUCUCCUCCCGUAGAAAACUCUGCCGUAUGUUGUCCGUAUGAACCAGGUGCAAGGAGUCCGCAGAGUUCGAUGGGUGGACCGGUCGUUGUAGACUAUUUACUGUCAUAUAUAACGGUUUGUGUCACUUCCUCGUUCAUGCCUACUGUACGGCCCUCAUCACUGGCUCCCAAACUUGAUCGCUCAUUUGUAGGUAUUAAUAGGGCUGUUUUACCGGCGACAAACGAAUCAAUCGAUUCCGAAAGAGUAAACGGCGCGCGAAAAUGCAACAGGGGACGACUCGUCGAAGACGGUAUUUGUCCGAUUACGACACGGAUAAGGACUCCCGCCACCCAUGGCAAGCUUUAUAUACCACCAGAUCAGGCGAACCUUGAAAACGUCACGAUCAAUACAUCGCGCGAGCAUGUCGGACUCAGUAUCUAUGUUCUAGAUAGAAUGGGUAAUGGGGUUACUGCUGUCUACGUACUACUACAUUAUUUGAUUGUCCCUUCCUUCGGAGGGGCUCUUCAUAAGAUUGCGGCGGCUUCGCCCAUGAAAAUCUGCGCGCGUGCAAGCAUAAACACACAAGUGAUCUUUGAGGGCGCGGUUAGACACCGCUGUGCCCAGGAUUUGGCCGUGUUUCGCAAACGAAUAAUGAUGCUAUUGAUCUCUAGGGUUGAAUGGACAGUAGUUCGGAGACAAGGAAUAGCGUGUGACCUAGAGUACUAUAAGUCCCAAGUGCCAGCGGGCAGCGCUACCAAAACAACCGAUAGGCUGUGCGAAGUUAGUUGCAACACUGCACCAGCGGGUAACGACCGUAAACCGCAGCUACUAUAUUAUGAUCCCGUUUGGGGUCUGCUUCGUGGCGCGCUCUAUGUCCCCGUUGCUCGAGAGCAAGACCAGGUAAGAGGCCUGCUGUUGGAGCAUUACCGAUCCCCGUUCGUCCCCGGGAAAAUUACCUCCACACUCCGCGGUAAUCCAUAUGUGGUUAGCAAAUUCAGCUCUCACAGCCCGCGGAAGGUGACUUGGCCUCCUAAUUGGCAACAUCGAACCCGUCGCUGGCAAACCUGGGGUCUACUCACAGGUGGCCAUAUAGAGCUUCCUGAAGGCAGUUCGUGGGGGGUGUUCGGCACGCCCGAUUUCAAGUCGCUUCGGACAGUGUCACCAGACAGUCGUACAACUUGCGGUGGUGCGCAGUACGUCAUUACAGCUAGAAGGUCACGGGGCUCAGGACCGUUCCCGUCCGUAAUUCUGAGCAAAAGCUGCGGUUGGUCAACUGAAGUAAUGUCGUUUGUUUGUAUGGAAAAAAAGCGCUGCUUCCCUAAGGCACUACUUAGCAUGAGCUACUCAUGGGGGCAGUCCGCCGUAGAUAACACGGAAAGCCUACCAAGAGCGCAGACCCGUAGAUAUUGUAAGGGCUCGGACUUACAGCUCGAGACUCGGGACCUACUUCAACAGAUCUCUGAUUCCGACCUGGGGAGCGUGAAUUGCCAUCAUGUACAAGAUACCCUUACCUCUUCAACCCUGGUCGCGUUUUUCUCGCGGUUAAGUAAGCUUAGGCCGUCAGGUACCGCCGCAUACAGAAAUAGUAGCUACGAAUGUGCCACUACCCGACUAAGCACGCGUUUAUCCCUGCUUGCUCAUCGGGCGAUUGCAUCAAAACGCCGUGCUACCAUCUCUCUAGUGUGGAAAACAAGCCUGUGGAAUUCAGAUGUAGUGUCAAGACUGGGGCACGUACUAUUCGCCCUGAAGUCUGUAUAUAAGGUCUCUGAACCAGCCCAUAGAGAGGACUCCGCAAGGGGCUCGAUUAUAUCGGCGCACGCGGAUUUCCCCAAUCAUCCACUUUUUGUUAUUACGCUCGUCUUUCUGCCGUGCAUGCUUUGGGCCGCGAUUCAGCCGUCCGAUGAACCACCGGCGAUACAAGGGAGUCCGCAGUGGGCGGAUAGACACCAAGCCUUAAGCAUAGACAGAGACAAAAUCUUACGAAACACUUGCCCUCCGACGCCAAUCUCUCCGCUACUCUGCAGAUCCAAUCCAUGUCACCCGGUUUUUUUUCAGAGGGCGUCGACAGUGAAGGCACGCUUUUACAUUUUGCAGAAUAUACCAAAUCAUCGAUUUACGAUGGUCUUAAUCGAGACCUGCCUAAAGCUGGUGUGGUUUAGCGCACUCUUGAAGAGGCAGAGGGCAGUUUGUGUCAUGUGUACUAGGACGCCCCCCUGUGUGCCAGCUCUAUCCGAACCAUCUCCCCCUGGGAGCUGUGAGAGCGGGGCUGCCCGGAACACGAACUUCACAGUGCGACGUCGACUGCAACAAAUAGUGGCGCUAGCACUGCAUUCCCCACUGCUGGUGUCACAAGAGUACUGCGACAUUUUUACAGACGUUUGGCUCUCUCGCAGAUGCACCCUGCAUUGGUUUUUCCCGAUCAGAGGGCAUGGUGACACUAAUGGCCCCGGGUCGUCCGAUGGGCUUGUUCCAGUAACUAAGAUCGAACUUGGCGGAUCACCUUCGCGCGUGGGUCGUCGAUCUCAUGGUCAUCUAAAUAUCGCAGAACCAUGUAAGGCGGACUACAAUGGGUUUGCUCAAUCCAUGAUAUUGGGAUUAUAUGAAACUAAGUCGUUCACUGUUGUUCUUAGUCGUUUUGCGAUUUUCGUGGUGUUUUUCCAAUGUCGGUUUCAAAUCACCCUUAUUAUUGGGCAAACCAAAUUGAACAUCUGCAAGGCAGGCCAUCCGAGUGCACAUUCGGCAGCCUGGAGGUGGUUAUCACGCCUCGAAGAGUACUGCUACUUGCCAACCAAGCGGCUGCUCAUUCAGGGCUCGCUGCGACAGCAGCUAACUAAACCUACAGCGAAGGAGAAUGUCCUUCACCGGUUAAUGGAAGCACCCAAGCGGAUAUACGAUAUUCAUGUGGCACUAAGAAUUGUUACAAUGAAGUUAGGACUCCGCAACGGUUCCGCAUCAGUAGUCAAUGAUCUAGAACUAGCUGUGACGUGUUGGCGCCCGACGAUGGGAUUGAUGUCUGCUCGAAGGCACCAAUCGGCUGUACGCACUCUUACUGCGCUACCCGGGUUAUGGCCAGGCGGCAAAUCGUAUUAUCAGUACAGGGCGCCCUUGCAGUGGGUUCUAAGUUAUGUUGUGGGCUACCUAGAUUGUACCCUUGGUACAGUACGCGCUUGUAUCACUACAACACUGGCUAGACUAGAAUAUCUCGGACCGCGUACCAGGCUGGCGAAUGGGACGCAAACGAGAAUCAGGAGAAGACCCCGCCGUAAUCGAAAGGGGGUGACCUCUCCCAGUUAUGAGCGUCUCUGUAUUAACAUUAUUCCAGGGUGUAGACACGGCAAGAUCGCUCCAGGUUCCGCCGACCGCCCCAGUAACCCGCGCUUCCAUAGAGCGGGCUUCAUAGGUCCAAACCACUCCAGUCCCGCCCAGAAAUCUGUAUCUAACCGAAACGGGGUCCGCGGGUAUAUUCUGCAGAUCGCUGGCGGUCGCAACAGACGUCUUACGCUUGACCGUCUCGCGCGAGGGUCAAGACUGUUGGGCCUGCGGCUCGCACGAGAACCCCGAAUCGGCCGGUUUAUCAAAAAUCGGAGAUGCAUGCCUCUAUGUGCUACGAUUCAGAGUUGGUGCACAGAGCAAGGCCUUGUGGCAUACCCUUACCAUUGCUUCAUGCCUAACAUUGCGAAUUACGACCUAUUUGCACGUUCUCAGCAUAAUCCAAUGACGCUAUCAGCUUUUAGUCUUCGAUCUUAA"

In [91]:
trans_prot(test)

'MLPMSAKFVNLSSDTLAPVTLMPRWAAATQSVIKRSPVRYTGILLPGPFYDTNGFVRSRRASVDRGIGTFSPFGDLYHQCVGTEFNVCQRFEQGGSLDPHNPLNLFTDQNIRRITHLRSCLYESDIRELYFRSYNVDKNIATKVRGGGIPEILYRLPSGRRLFGEVRNFHQPLSPLAMTLRNTSAPVSAIHQERDVFDTEISALHSAKRVGVYMFVHYHQFVVTPTTNTTSAWPGENLKGIQVYIPDLNSPFLVFYFILLDLVVKSSSSKQPSGGTAYRVTKHTQGMKHTGSSACRIRIALPSFNRYIFDLIQGNHARAQHSTVDRMGSDCSPPYATHMTTCGIPPETGLRLSAPKENNRLLAPDPRLTQKRVGDKYTSKATVFAARLSTFSPIIKMMHLIRLKQLSAERQCTLSSPVGVLCLLHRDLSRKASVASYRCCPPDVQPLKRSKTTCERTSVLGRKTGRGEEGYYHIELASRCSPTNAPVGDGECAPRQFRVASRATVPSLRRLVDIPGNVNCLDNFQSGALYAKKRVVGPERTFRRTDKFTSLPIYGIQLEFETQVPGIFCFVLGLKASVLRRVLSYAEKLSLSGRSVRCARVTGCIWLLRTACCTRSLHAHGRHSVLINYAIHHFYFLPFPIRGNASQLESGLHCKTSVIQNLPPVSMLSHSVVVPTYGYVSFAHPKVPDRKPNITASSGYSFWQIVLYVERRSEGLERRTCLADENLAPWPRTSSAQSTAGTIQVQLLPAEFIGGGLLYIREKSLLSRERPSAPELPRARSLCKHTTGACLNGRRSELHVVDASHPGSYRQGYSVQMNEKSAAELIRHLYPHDRQISVFPCPTGTSTGVRKLCQAAVSDVSVGDIANLQTGLRPYSCVAFKPCLTRPKTFKTWPVTLAKCTRLDARFAGLVTTIVGQSYGEFIFIGETQCLSRTNKYQNFIKMRGDIKPLRLFWTPIAWVAIPNRDRIYSNANLVWVGGRSSPVSFIPCQGCSGLACPA