In [1]:
from Bio.Seq import Seq

# Wrap a mixed-case DNA string in a Seq, then show its text and its type
# on separate lines.
tatabox_seq = Seq("tataaaggcAATATGCAGTTAG")
print(tatabox_seq, type(tatabox_seq), sep="\n")

tataaaggcAATATGCAGTTAG
<class 'Bio.Seq.Seq'>


In [2]:
from Bio.Seq import Seq

# Count how many times the letter 'A' occurs in a short sequence.
exon_seq = Seq("ATGCAGTAG")
count_a = exon_seq.count("A")
count_a  # bare last expression: displayed as the cell result

3

In [3]:
from Bio.Seq import Seq

# GC content (in percent) computed by hand from the base counts of
# exon_seq, which is created in an earlier cell.
g_count, c_count = (exon_seq.count(base) for base in "GC")

gc_contents = (g_count + c_count) / len(exon_seq) * 100
gc_contents  # bare last expression: displayed as the cell result

44.44444444444444

In [4]:
from Bio.Seq import Seq

# Print the same sequence fully upper-cased, then fully lower-cased.
tatabox_seq = Seq("tataaaggcAATATGCAGTTAG")
for cased_seq in (tatabox_seq.upper(), tatabox_seq.lower()):
    print(cased_seq)

TATAAAGGCAATATGCAGTTAG
tataaaggcaatatgcagttag


In [5]:
from Bio.Seq import Seq

# From one DNA sequence derive both the transcript (transcribe) and the
# protein (translate); the two results are independent of each other.
dna = Seq("ATGCAGTAG")
ptn = dna.translate()
mrna = dna.transcribe()

# Same single-line, space-separated output as print(mrna, ptn).
print(" ".join(str(product) for product in (mrna, ptn)))

AUGCAGUAG MQ*


In [6]:
# Translate an mRNA all the way through; stop codons inside the sequence
# show up as '*' in the resulting protein.
mrna = Seq("AUGAACUAAGUUUAGAAU")
ptn = mrna.translate()
ptn  # bare last expression: displayed as the cell result

Seq('MN*V*N')

In [7]:
# Re-translate the mrna from the previous cell, this time with to_stop=True
# so translation ends at the first stop codon (no '*' in the result).
ptn = mrna.translate(to_stop=True)
ptn

Seq('MN')

In [8]:
# Translate the full mRNA, print the raw protein, then print each fragment
# between stop markers ('*') on its own line.
mrna = Seq("AUGAACUAAGUUUAGAAU")
ptn = mrna.translate()
print(ptn)
print(*ptn.split("*"), sep="\n")

MN*V*N
MN
V
N


In [9]:
# Show the complement and the reverse complement of one DNA sequence,
# side by side on a single line.
seq = Seq("TATAAGGCAATATGCAGTAG")
rev_comp_seq = seq.reverse_complement()
com_seq = seq.complement()
print(com_seq, rev_comp_seq, sep=" ")

ATATTCCGTTATACGTCATC CTACTGCATATTGCCTTATA


In [10]:
from Bio.Data import CodonTable

# Look up the unambiguous DNA codon table registered under the name
# "Standard" and print its text rendering.
codon_table = CodonTable.unambiguous_dna_by_name["Standard"]
print(str(codon_table))

Table 1 Standard, SGC0

  |  T      |  C      |  A      |  G      |
--+---------+---------+---------+---------+--
T | TTT F   | TCT S   | TAT Y   | TGT C   | T
T | TTC F   | TCC S   | TAC Y   | TGC C   | C
T | TTA L   | TCA S   | TAA Stop| TGA Stop| A
T | TTG L(s)| TCG S   | TAG Stop| TGG W   | G
--+---------+---------+---------+---------+--
C | CTT L   | CCT P   | CAT H   | CGT R   | T
C | CTC L   | CCC P   | CAC H   | CGC R   | C
C | CTA L   | CCA P   | CAA Q   | CGA R   | A
C | CTG L(s)| CCG P   | CAG Q   | CGG R   | G
--+---------+---------+---------+---------+--
A | ATT I   | ACT T   | AAT N   | AGT S   | T
A | ATC I   | ACC T   | AAC N   | AGC S   | C
A | ATA I   | ACA T   | AAA K   | AGA R   | A
A | ATG M(s)| ACG T   | AAG K   | AGG R   | G
--+---------+---------+---------+---------+--
G | GTT V   | GCT A   | GAT D   | GGT G   | T
G | GTC V   | GCC A   | GAC D   | GGC G   | C
G | GTA V   | GCA A   | GAA E   | GGA G   | A
G | GTG V   | GCG A   | GAG E   | GGG G   | G
--+---------+---------+---------+---------+--

In [11]:
# Same lookup as for the standard table, but for the table registered as
# "Vertebrate Mitochondrial"; relies on CodonTable imported in an earlier cell.
codon_table = CodonTable.unambiguous_dna_by_name["Vertebrate Mitochondrial"]
print(str(codon_table))

Table 2 Vertebrate Mitochondrial, SGC1

  |  T      |  C      |  A      |  G      |
--+---------+---------+---------+---------+--
T | TTT F   | TCT S   | TAT Y   | TGT C   | T
T | TTC F   | TCC S   | TAC Y   | TGC C   | C
T | TTA L   | TCA S   | TAA Stop| TGA W   | A
T | TTG L   | TCG S   | TAG Stop| TGG W   | G
--+---------+---------+---------+---------+--
C | CTT L   | CCT P   | CAT H   | CGT R   | T
C | CTC L   | CCC P   | CAC H   | CGC R   | C
C | CTA L   | CCA P   | CAA Q   | CGA R   | A
C | CTG L   | CCG P   | CAG Q   | CGG R   | G
--+---------+---------+---------+---------+--
A | ATT I(s)| ACT T   | AAT N   | AGT S   | T
A | ATC I(s)| ACC T   | AAC N   | AGC S   | C
A | ATA M(s)| ACA T   | AAA K   | AGA Stop| A
A | ATG M(s)| ACG T   | AAG K   | AGG Stop| G
--+---------+---------+---------+---------+--
G | GTT V   | GCT A   | GAT D   | GGT G   | T
G | GTC V   | GCC A   | GAC D   | GGC G   | C
G | GTA V   | GCA A   | GAA E   | GGA G   | A
G | GTG V(s)| GCG A   | GAG E   | GGG G   | G
--+---------+---------+---------+---------+--

In [12]:
# Bio.SeqUtils.GC was deprecated in Biopython 1.80 and later removed, so a
# plain `from Bio.SeqUtils import GC` fails on current releases.
# Its replacement, gc_fraction, returns a 0-1 fraction rather than a
# percentage. Prefer gc_fraction and fall back to GC on older installs.
try:
    from Bio.SeqUtils import gc_fraction
except ImportError:
    gc_fraction = None
    from Bio.SeqUtils import GC

exon_seq = Seq('ATGCAGTAG')
if gc_fraction is not None:
    gc_contents = gc_fraction(exon_seq) * 100  # scale the fraction to percent
else:
    gc_contents = GC(exon_seq)  # legacy helper already returns percent
print(gc_contents)

44.44444444444444


In [13]:
from Bio.SeqUtils import six_frame_translations

# Build the sequence reused by the next cell (hence the name seq1 is kept)
# and print the text report produced by six_frame_translations.
seq1 = Seq("ATGCCTTGAAATGTATAG")
six_frame_report = six_frame_translations(seq1)
print(six_frame_report)

GC_Frame: a:6 t:6 g:4 c:2 
Sequence: atgccttgaaatgtatag, 18 nt, 33.33 %GC


1/1
  A  L  K  C  I
 C  L  E  M  Y
M  P  *  N  V  *
atgccttgaaatgtatag   33 %
tacggaactttacatatc
G  Q  F  T  Y 
 H  R  S  I  Y  L
  A  K  F  H  I




In [14]:
from Bio.SeqUtils import MeltingTemp as mt

# Melting temperature of seq1 (the Seq created in the previous cell),
# computed with MeltingTemp.Tm_Wallace.
wallace_tm = mt.Tm_Wallace(seq1)
print(wallace_tm)

48.0


In [15]:
# Import the three-letter -> one-letter converter under an alias.
# Importing it as plain `seq1` would overwrite the notebook variable `seq1`
# (a Seq created in an earlier cell and passed to mt.Tm_Wallace), so
# re-running that earlier cell afterwards would fail.
from Bio.SeqUtils import seq1 as three_to_one

# Concatenated three-letter amino-acid codes to be collapsed to one letter each.
essential_amino_acid_3 = 'LeuLysMetValIleThrTrpPhe'
print(three_to_one(essential_amino_acid_3))

LKMVITWF
