In [1]:
import datablocks
from datablocks import DB, signature
import micron, micron.datasets

# BIOPYTHON: ALIGN

In [5]:
from Bio import pairwise2
from Bio.Seq import Seq

In [6]:
# Two short example sequences used as inputs for the pairwise2 demo below.
seq1, seq2 = Seq("ACCGGT"), Seq("ACGT")

In [7]:
# Global alignment through the pairwise2 API. The "xx" suffix selects the
# simplest scoring scheme: +1 per identical character, no mismatch penalty
# and no gap penalties (see the Bio.pairwise2 docs for the naming scheme).
alignments = pairwise2.align.globalxx(seq1, seq2)

In [8]:
# Show the raw result: a list of Alignment records with the fields
# seqA, seqB, score, start and end.
alignments

[Alignment(seqA='ACCGGT', seqB='A-C-GT', score=4.0, start=0, end=6),
 Alignment(seqA='ACCGGT', seqB='AC--GT', score=4.0, start=0, end=6),
 Alignment(seqA='ACCGGT', seqB='A-CG-T', score=4.0, start=0, end=6),
 Alignment(seqA='ACCGGT', seqB='AC-G-T', score=4.0, start=0, end=6)]

In [9]:
# Pretty-print every alignment. format_alignment takes the record's fields
# positionally, which is why each record is star-unpacked.
for aln in alignments:
    rendered = pairwise2.format_alignment(*aln)
    print(rendered)

ACCGGT
| | ||
A-C-GT
  Score=4

ACCGGT
||  ||
AC--GT
  Score=4

ACCGGT
| || |
A-CG-T
  Score=4

ACCGGT
|| | |
AC-G-T
  Score=4



## Preferred alignment API: `Bio.Align.PairwiseAligner`

In [13]:
from Bio import Align
# Build an aligner with the library's default settings. Ending the cell on the
# bare name displays the object's repr; the full parameter list is printed in
# the next cell.
aligner = Align.PairwiseAligner()
aligner

Pairwise aligner, implementing the Needleman-Wunsch, Smith-Waterman, Gotoh, and Waterman-Smith-Beyer global and local alignment algorithms

In [14]:
# print() uses str(aligner), which lists every scoring parameter and the
# current alignment mode.
print(aligner)

Pairwise sequence aligner with parameters
  wildcard: None
  match_score: 1.000000
  mismatch_score: 0.000000
  target_internal_open_gap_score: 0.000000
  target_internal_extend_gap_score: 0.000000
  target_left_open_gap_score: 0.000000
  target_left_extend_gap_score: 0.000000
  target_right_open_gap_score: 0.000000
  target_right_extend_gap_score: 0.000000
  query_internal_open_gap_score: 0.000000
  query_internal_extend_gap_score: 0.000000
  query_left_open_gap_score: 0.000000
  query_left_extend_gap_score: 0.000000
  query_right_open_gap_score: 0.000000
  query_right_extend_gap_score: 0.000000
  mode: global



### score

In [12]:
# Score only: ask the aligner for the best score of `query` against `target`
# using its current settings, then display it.
target, query = "GAACT", "GAT"
score = aligner.score(target, query)
score

3.0

### alignments

In [15]:
# Enumerate the optimal alignments for the same pair; printing an alignment
# renders it as a target / match-line / query text diagram.
alignments = aligner.align(target, query)
for aln in alignments:
    print(aln)

target            0 GAACT 5
                  0 ||--| 5
query             0 GA--T 3

target            0 GAACT 5
                  0 |-|-| 5
query             0 G-A-T 3



### local

In [17]:
# Local-alignment example on a new sequence pair.
target, query = "AGAACTC", "GAACT"
# NOTE: this mutates the shared `aligner` object in place, so any earlier
# cell that is re-run after this one will also align in local mode.
aligner.mode = "local"
score = aligner.score(target, query)
score

5.0

In [18]:
# Print every optimal local alignment of `query` within `target`.
alignments = aligner.align(target, query)
for aln in alignments:
    print(aln)

target            1 GAACT 6
                  0 ||||| 5
query             0 GAACT 5



# DATASETS