# Protein Synthesis

Protein synthesis is the process by which cells make proteins. It happens in two stages:

- Transcription
- Translation

In [2]:
from Bio.Seq import Seq

In [3]:
# Example DNA sequence used throughout the notebook (12 bases = 4 codons)
dna_seq = Seq('ATGATCTCGTAA')

In [4]:
# Length of the sequence in nucleotides
len(dna_seq)

12

In [None]:
# An A-T base pair is held together by 2 hydrogen bonds
# A G-C base pair is held together by 3 hydrogen bonds
# So a higher GC content usually means the double helix is more heat stable

In [6]:
# Display the original sequence for comparison with the results below
dna_seq


Seq('ATGATCTCGTAA')

In [5]:
# Complement: replace each base with its pairing partner (A<->T, G<->C)
dna_seq.complement()

Seq('TACTAGAGCATT')

In [7]:
# Reverse complement: the complement, read in the opposite direction
dna_seq.reverse_complement()

Seq('TTACGAGATCAT')

In [9]:
# Manual reverse complement: take the complement, then reverse it with a
# slice; this gives the same result as reverse_complement()
dna_seq.complement()[::-1]

Seq('TTACGAGATCAT')

## Protein Synthesis

In [11]:
# The DNA sequence that is transcribed and translated in this section
dna_seq

Seq('ATGATCTCGTAA')

In [10]:
# Transcription: DNA -> mRNA
# The DNA "message" is rewritten as RNA; every T becomes a U

dna_seq.transcribe()


Seq('AUGAUCUCGUAA')

In [13]:
# Keep the transcript so it can be translated in the following cells
mRNA = dna_seq.transcribe()

In [14]:
# Translation: mRNA -> protein (amino acid sequence)
# Method 1: translate the transcribed mRNA
mRNA.translate()
# A "*" in the result marks a stop codon

Seq('MIS*')

In [15]:
# Method 2: translate the DNA directly into an amino acid sequence,
# without an explicit transcription step
dna_seq.translate()

Seq('MIS*')

In [16]:
# Use a custom symbol for stop codons instead of the default "*"
mRNA.translate(stop_symbol="@")


Seq('MIS@')

In [17]:
# Back transcription: convert mRNA back to DNA (every U becomes a T)

mRNA.back_transcribe()

Seq('ATGATCTCGTAA')

In [18]:
# Round-trip check: back-transcribing the mRNA recovers the original DNA
mRNA.back_transcribe() == dna_seq

True

In [20]:
# Chain both steps in one expression: DNA -> mRNA -> protein
dna_seq.transcribe().translate()

Seq('MIS*')

In [21]:
# Helpers for converting between 1-letter and 3-letter amino acid codes
from Bio.SeqUtils import seq3,seq1


In [22]:
# Amino acid sequence (1-letter codes) translated directly from the DNA
aa = dna_seq.translate()

In [23]:
# Display the 1-letter amino acid sequence
aa

Seq('MIS*')

In [24]:
# Convert 1-letter codes to 3-letter codes; the stop symbol "*" becomes "Ter"
seq3(aa)

'MetIleSerTer'

In [26]:
# Convert 3-letter amino acid codes back to 1-letter codes

seq1('MetIleSerTer')


'MIS*'

In [27]:
# View our codon table
from Bio.Data import CodonTable

In [28]:
# List the names defined in the CodonTable module
# (classes, helper functions, and the prebuilt codon tables)
dir(CodonTable)

['AmbiguousCodonTable',
 'AmbiguousForwardTable',
 'CodonTable',
 'IUPACData',
 'NCBICodonTable',
 'NCBICodonTableDNA',
 'NCBICodonTableRNA',
 'TranslationError',
 '__builtins__',
 '__cached__',
 '__doc__',
 '__file__',
 '__loader__',
 '__name__',
 '__package__',
 '__spec__',
 'ambiguous_dna_by_id',
 'ambiguous_dna_by_name',
 'ambiguous_generic_by_id',
 'ambiguous_generic_by_name',
 'ambiguous_rna_by_id',
 'ambiguous_rna_by_name',
 'generic_by_id',
 'generic_by_name',
 'list_ambiguous_codons',
 'list_possible_proteins',
 'make_back_table',
 'register_ncbi_table',
 'standard_dna_table',
 'standard_rna_table',
 'unambiguous_dna_by_id',
 'unambiguous_dna_by_name',
 'unambiguous_rna_by_id',
 'unambiguous_rna_by_name']

In [31]:
# Print the standard codon table for DNA codons
# "(s)" marks a start codon; "Stop" marks a stop codon
print(CodonTable.unambiguous_dna_by_name['Standard'])

Table 1 Standard, SGC0

  |  T      |  C      |  A      |  G      |
--+---------+---------+---------+---------+--
T | TTT F   | TCT S   | TAT Y   | TGT C   | T
T | TTC F   | TCC S   | TAC Y   | TGC C   | C
T | TTA L   | TCA S   | TAA Stop| TGA Stop| A
T | TTG L(s)| TCG S   | TAG Stop| TGG W   | G
--+---------+---------+---------+---------+--
C | CTT L   | CCT P   | CAT H   | CGT R   | T
C | CTC L   | CCC P   | CAC H   | CGC R   | C
C | CTA L   | CCA P   | CAA Q   | CGA R   | A
C | CTG L(s)| CCG P   | CAG Q   | CGG R   | G
--+---------+---------+---------+---------+--
A | ATT I   | ACT T   | AAT N   | AGT S   | T
A | ATC I   | ACC T   | AAC N   | AGC S   | C
A | ATA I   | ACA T   | AAA K   | AGA R   | A
A | ATG M(s)| ACG T   | AAG K   | AGG R   | G
--+---------+---------+---------+---------+--
G | GTT V   | GCT A   | GAT D   | GGT G   | T
G | GTC V   | GCC A   | GAC D   | GGC G   | C
G | GTA V   | GCA A   | GAA E   | GGA G   | A
G | GTG V   | GCG A   | GAG E   | GGG G   | G
--+---------+---------+---------+---------+--

In [32]:
# Print the standard codon table for RNA codons (U in place of T)
# "(s)" marks a start codon; "Stop" marks a stop codon
print(CodonTable.unambiguous_rna_by_name['Standard'])

Table 1 Standard, SGC0

  |  U      |  C      |  A      |  G      |
--+---------+---------+---------+---------+--
U | UUU F   | UCU S   | UAU Y   | UGU C   | U
U | UUC F   | UCC S   | UAC Y   | UGC C   | C
U | UUA L   | UCA S   | UAA Stop| UGA Stop| A
U | UUG L(s)| UCG S   | UAG Stop| UGG W   | G
--+---------+---------+---------+---------+--
C | CUU L   | CCU P   | CAU H   | CGU R   | U
C | CUC L   | CCC P   | CAC H   | CGC R   | C
C | CUA L   | CCA P   | CAA Q   | CGA R   | A
C | CUG L(s)| CCG P   | CAG Q   | CGG R   | G
--+---------+---------+---------+---------+--
A | AUU I   | ACU T   | AAU N   | AGU S   | U
A | AUC I   | ACC T   | AAC N   | AGC S   | C
A | AUA I   | ACA T   | AAA K   | AGA R   | A
A | AUG M(s)| ACG T   | AAG K   | AGG R   | G
--+---------+---------+---------+---------+--
G | GUU V   | GCU A   | GAU D   | GGU G   | U
G | GUC V   | GCC A   | GAC D   | GGC G   | C
G | GUA V   | GCA A   | GAA E   | GGA G   | A
G | GUG V   | GCG A   | GAG E   | GGG G   | G
--+---------+---------+---------+---------+--