<a href="https://colab.research.google.com/github/pchroscicki/Basic-Bioinformatics/blob/main/biopython.ipynb" target="_parent"><img src="https://colab.research.google.com/assets/colab-badge.svg" alt="Open In Colab"/></a>

In [6]:
pip install biopython



# **Importing a sequence**

In [8]:
from Bio import SeqIO

# Open the FASTA file and parse the sequence
filename = "tom40.fasta"
for record in SeqIO.parse(filename, "fasta"):
    sequence = record.seq
    print(sequence)

MSAPTPLAEASQIPTIPALSPLTAKQSKGNFFSSNPISSFVVDTYKQLHSHRQSLELVNPGTVENLNKEVSRDVFLSQYFFTGLRADLNKAFSMNPAFQTSHTFSIGSQALPKYAFSALFANDNLFAQGNIDNDLSVSGRLNYGWDKKNISKVNLQISDGQPTMCQLEQDYQASDFSVNVKTLNPSFSEKGEFTGVAVASFLQSVTPQLALGLETLYSRTDGSAPGDAGVSYLTRYVSKKQDWIFSGQLQANGALIASLWRKVAQNVEAGIETTLQAGMVPITDPLMGTPIGIQPTVEGSTTIGAKYEYRQSVYRGTLDSNGKVACFLERKVLPTLSVLFCGEIDHFKNDTKIGCGLQFETAGNQELLMLQQGLDADGNPLQALPQL


# **Reverse complement**

In [9]:
from Bio.Seq import Seq

# Create a DNA sequence
sequence = Seq("ATCGGTAATGATAGATGA")

# Get the reverse complement
reverse_complement = sequence.reverse_complement()

# Print the reverse complement
print(reverse_complement)

TCATCTATCATTACCGAT


# **Transcription (DNA to RNA)**

In [10]:
from Bio.Seq import Seq

# Create a DNA sequence
dna_sequence = Seq("ATCGGTAATGATAGATGA")

# Perform transcription
rna_sequence = dna_sequence.transcribe()

# Print the RNA sequence
print(rna_sequence)

AUCGGUAAUGAUAGAUGA



# **Translation (DNA/RNA to protein)**

In [11]:
from Bio.Seq import Seq

# Create a DNA sequence
dna_sequence = Seq("ATGGGTAATGATAGATGA")

# Perform translation to protein
protein_sequence = dna_sequence.translate()

# Print the protein sequence
print(protein_sequence)

MGNDR*


# Sequence Alignment

In [12]:
from Bio import Align

# Create a pairwise sequence aligner
aligner = Align.PairwiseAligner()

# Add sequences to align
seq1 = "ACGTTAGATAGTAGTGATGATGTGATG"
seq2 = "ACTAG"
alignments = aligner.align(seq1, seq2)

# Print the alignments
for alignment in alignments:
    print(alignment)

target            0 ACGTTAGATAGTAGTGATGATGTGATG 27
                  0 ||-|-||-------------------- 27
query             0 AC-T-AG--------------------  5

target            0 ACGTTAGATAGTAGTGATGATGTGATG 27
                  0 ||--|||-------------------- 27
query             0 AC--TAG--------------------  5

target            0 ACGTTAGATAGTAGTGATGATGTGATG 27
                  0 ||-|-|----|---------------- 27
query             0 AC-T-A----G----------------  5

target            0 ACGTTAGATAGTAGTGATGATGTGATG 27
                  0 ||--||----|---------------- 27
query             0 AC--TA----G----------------  5

target            0 ACGTTAGATAGTAGTGATGATGTGATG 27
                  0 ||-|---|--|---------------- 27
query             0 AC-T---A--G----------------  5

target            0 ACGTTAGATAGTAGTGATGATGTGATG 27
                  0 ||--|--|--|---------------- 27
query             0 AC--T--A--G----------------  5

target            0 ACGTTAGATAGTAGTGATGATGTGATG 27
                  0 ||-|-


# **Sequence Comparison biopython**

In [13]:
from Bio import pairwise2
from Bio.Seq import Seq

# Create two DNA sequences
seq1 = Seq("ATCGGTA")
seq2 = Seq("ATGGTCA")

# Perform pairwise sequence alignment
alignments = pairwise2.align.globalxx(seq1, seq2)

# Print the alignments
for alignment in alignments:
    print(pairwise2.format_alignment(*alignment))

ATCGGT-A
|| ||| |
AT-GGTCA
  Score=6



