# Housekeeping Gene Working

In [1]:
from Bio.Seq import Seq

In [4]:
# Housekeeping gene fragment whose base composition is tallied below.
hk_seq = Seq("AGCCATTTCTACTTTGCCCGCCCACAGATGTA")

# Count each nucleotide in a single pass over the base letters (A, T, C, G).
count_A, count_T, count_C, count_G = (hk_seq.count(base) for base in "ATCG")

# One count per line, in the order A, T, C, G.
print(count_A, count_T, count_C, count_G, sep="\n")

7
9
11
5


# GC-contents 계산

In [12]:
print(len(hk_seq)) # total number of bases in the housekeeping gene sequence

32


In [11]:
# GC content: share of G and C bases over the whole sequence, as a percentage.
count_G, count_C = hk_seq.count("G"), hk_seq.count("C")
gc_total = count_G + count_C
GC_contents = gc_total / len(hk_seq) * 100
print(GC_contents)

50.0


# Housekeeping Gene 전사와 번역하기

In [15]:
# Transcribe the housekeeping gene fragment to mRNA and translate it to protein.
dna = Seq("AGCCATTTCTACTTTGCCCGCCCACAGATGTA")
mrna = dna.transcribe()

# The fragment is 32 nt long: 10 complete codons plus 2 leftover bases.
# Drop the incomplete trailing codon explicitly so translate() is never handed
# a partial codon (Biopython emits a BiopythonWarning for that case and states
# it may become an error in a future release). The translated protein is the
# same as before because the partial codon never contributed a residue.
coding_dna = dna[: len(dna) - len(dna) % 3]
protein = coding_dna.translate()

print(dna)  # DNA sequence
print(mrna)  # transcribed mRNA sequence
print(protein)  # translated amino-acid sequence

AGCCATTTCTACTTTGCCCGCCCACAGATGTA
AGCCAUUUCUACUUUGCCCGCCCACAGAUGUA
SHFYFARPQM


# 코돈표 출력하기

In [10]:
from Bio.Data import CodonTable

In [11]:
# Fetch the standard genetic code by name, then show the full codon table
# followed by its list of stop codons.
codon_table = CodonTable.unambiguous_dna_by_name["Standard"]
print(codon_table, codon_table.stop_codons, sep="\n")

Table 1 Standard, SGC0

  |  T      |  C      |  A      |  G      |
--+---------+---------+---------+---------+--
T | TTT F   | TCT S   | TAT Y   | TGT C   | T
T | TTC F   | TCC S   | TAC Y   | TGC C   | C
T | TTA L   | TCA S   | TAA Stop| TGA Stop| A
T | TTG L(s)| TCG S   | TAG Stop| TGG W   | G
--+---------+---------+---------+---------+--
C | CTT L   | CCT P   | CAT H   | CGT R   | T
C | CTC L   | CCC P   | CAC H   | CGC R   | C
C | CTA L   | CCA P   | CAA Q   | CGA R   | A
C | CTG L(s)| CCG P   | CAG Q   | CGG R   | G
--+---------+---------+---------+---------+--
A | ATT I   | ACT T   | AAT N   | AGT S   | T
A | ATC I   | ACC T   | AAC N   | AGC S   | C
A | ATA I   | ACA T   | AAA K   | AGA R   | A
A | ATG M(s)| ACG T   | AAG K   | AGG R   | G
--+---------+---------+---------+---------+--
G | GTT V   | GCT A   | GAT D   | GGT G   | T
G | GTC V   | GCC A   | GAC D   | GGC G   | C
G | GTA V   | GCA A   | GAA E   | GGA G   | A
G | GTG V   | GCG A   | GAG E   | GGG G   | G
--+---------+---------+---------+---------+--
['TAA', 'TAG', 'TGA']

In [12]:
# Same lookup for the vertebrate mitochondrial genetic code, to compare with
# the standard table: print the table first, then its stop codons.
mitochondrial_table = CodonTable.unambiguous_dna_by_name["Vertebrate Mitochondrial"]
mitochondrial_stops = mitochondrial_table.stop_codons
print(mitochondrial_table)
print(mitochondrial_stops)

Table 2 Vertebrate Mitochondrial, SGC1

  |  T      |  C      |  A      |  G      |
--+---------+---------+---------+---------+--
T | TTT F   | TCT S   | TAT Y   | TGT C   | T
T | TTC F   | TCC S   | TAC Y   | TGC C   | C
T | TTA L   | TCA S   | TAA Stop| TGA W   | A
T | TTG L   | TCG S   | TAG Stop| TGG W   | G
--+---------+---------+---------+---------+--
C | CTT L   | CCT P   | CAT H   | CGT R   | T
C | CTC L   | CCC P   | CAC H   | CGC R   | C
C | CTA L   | CCA P   | CAA Q   | CGA R   | A
C | CTG L   | CCG P   | CAG Q   | CGG R   | G
--+---------+---------+---------+---------+--
A | ATT I(s)| ACT T   | AAT N   | AGT S   | T
A | ATC I(s)| ACC T   | AAC N   | AGC S   | C
A | ATA M(s)| ACA T   | AAA K   | AGA Stop| A
A | ATG M(s)| ACG T   | AAG K   | AGG Stop| G
--+---------+---------+---------+---------+--
G | GTT V   | GCT A   | GAT D   | GGT G   | T
G | GTC V   | GCC A   | GAC D   | GGC G   | C
G | GTA V   | GCA A   | GAA E   | GGA G   | A
G | GTG V(s)| GCG A   | GAG E   | GGG G   | G
--+---------+---------+---------+---------+--
['TAA', 'TAG', 'AGA', 'AGG']

# Housekeeping Gene 상보적 / 역상보적 서열 만들기

* 5' - AGCCATTTCTACTTTGCCCGCCCACAGATGTA - 3'
* 3' - TCGGTAAAGATGAAACGGGCGGGTGTCTACAT - 5'

In [25]:
# Build the complementary strand of the housekeeping gene fragment.
hk_seq = Seq("AGCCATTTCTACTTTGCCCGCCCACAGATGTA")
comp_seq = hk_seq.complement()

print(comp_seq) # prints the complementary sequence; it belongs on the 3'-5' line of the strand diagram in the markdown above


TCGGTAAAGATGAAACGGGCGGGTGTCTACAT


In [27]:
# Reverse complement of hk_seq (defined in the complement cell).
rev_comp_seq = hk_seq.reverse_complement()
print(rev_comp_seq) # prints the reverse-complement sequence

TACATCTGTGGGCGGGCAAAGTAGAAATGGCT
