# **Exercício Biopython Parte I: Curso Python para bioinformática**

In [None]:
!pip install biopython

Collecting biopython
[?25l  Downloading https://files.pythonhosted.org/packages/76/02/8b606c4aa92ff61b5eda71d23b499ab1de57d5e818be33f77b01a6f435a8/biopython-1.78-cp36-cp36m-manylinux1_x86_64.whl (2.3MB)
[K     |████████████████████████████████| 2.3MB 7.8MB/s 
Installing collected packages: biopython
Successfully installed biopython-1.78


In [None]:
from Bio.Seq import Seq  # Seq lets us define biological sequences

In [None]:
# Build a 21-nucleotide DNA sequence and display it as the cell output.
sequence = Seq('TCGATCAGCTAGCATGCATCA')
sequence

Seq('TCGATCAGCTAGCATGCATCA')

In [None]:
# Transcribe DNA to RNA: every T in the sequence becomes U.
sequence.transcribe()

Seq('UCGAUCAGCUAGCAUGCAUCA')

In [None]:
# Translate the 7 codons into amino acids; the TAG codon shows up as '*'.
sequence.translate()

Seq('SIS*HAS')

In [None]:
# Reverse-complement of the sequence (the opposite strand, read in reverse).
sequence.reverse_complement()

Seq('TGATGCATGCTAGCTGATCGA')

In [None]:
# Slicing a Seq returns another Seq; here, the first three nucleotides.
sequence[0:3]

Seq('TCG')

In [None]:
# SeqRecord lets us define a sequence together with annotations about it;
# SeqFeature / FeatureLocation describe annotated regions of that sequence.
from Bio.SeqRecord import SeqRecord
from Bio.SeqFeature import SeqFeature, FeatureLocation

In [None]:
# Coding sequence of 15 nucleotides, i.e. 5 codons: ATG GCA AAA GAG TGA.
sequence = Seq('ATGGCAAAAGAGTGA')

# A single 'gene' feature covering the whole sequence on the forward strand.
# Locations are 0-based and end-exclusive, so (0, len(sequence)) is written
# as 1..15 in the GenBank/EMBL output. The end is derived from the sequence
# so the feature stays in sync if the sequence is edited.
features = [
    SeqFeature(
        FeatureLocation(0, len(sequence), strand=1),
        type='gene',
        qualifiers={'locus_tag': ['omx_0001'], 'gene': ['omX']},
    )
]

record = SeqRecord(
    sequence,
    id='OMX001.1',
    name='omX',
    description='omixicin',
    # Appears as the molecule type ("DNA") in the GenBank and EMBL output.
    annotations={'molecule_type': 'DNA'},
    features=features,
)

In [None]:
# Display the SeqRecord's repr (sequence, id, name, description, dbxrefs).
record

SeqRecord(seq=Seq('ATGGCAAAAGAGTGA'), id='OMX001.1', name='omX', description='omixicin', dbxrefs=[])

In [None]:
# Render the record as GenBank text; print() keeps the line breaks readable.
print(record.format('genbank'))

LOCUS       omX                       15 bp    DNA              UNK 01-JAN-1980
DEFINITION  omixicin.
ACCESSION   OMX001
VERSION     OMX001.1
KEYWORDS    .
SOURCE      .
  ORGANISM  .
            .
FEATURES             Location/Qualifiers
     gene            1..15
                     /locus_tag="omx_0001"
                     /gene="omX"
ORIGIN
        1 atggcaaaag agtga
//



In [None]:
# Render the same record as EMBL text.
print(record.format('embl'))

ID   OMX001; SV 1; ; DNA; ; UNC; 15 BP.
XX
AC   OMX001;
XX
DE   omixicin
XX
OS   .
OC   .
XX
FH   Key             Location/Qualifiers
FH
FT   gene            1..15
FT                   /locus_tag="omx_0001"
FT                   /gene="omX"
XX
SQ   Sequence 15 BP; 7 A; 1 C; 5 G; 2 T; 0 other;
     atggcaaaag agtga                                                         15
//



In [None]:
# Render the same record as FASTA (header line with id and description, then the sequence).
print(record.format('fasta'))

>OMX001.1 omixicin
ATGGCAAAAGAGTGA



In [None]:
from Bio import SeqIO

In [None]:
# Save the annotated record to disk in GenBank format.
# SeqIO.write is given a one-element list holding the record.
records_to_save = [record]
with open('annotation.gb', 'w') as out_handle:
    SeqIO.write(records_to_save, out_handle, 'genbank')

In [None]:
# Read the GenBank file back and list each record's id followed by the
# type and start/end coordinates of every feature it carries.
# The loop variable is deliberately NOT called `record`, so the SeqRecord
# built earlier in the notebook is not overwritten and earlier cells can be
# re-run with the same result.
with open('annotation.gb', 'r') as reader:
    parser = SeqIO.parse(reader, 'genbank')
    for parsed_record in parser:
        print(parsed_record.id)
        for feature in parsed_record.features:
            # start/end are printed 0-based, end-exclusive (e.g. "gene 0 15").
            print(feature.type, feature.location.start, feature.location.end)

OMX001.1
gene 0 15
