# QUAST Assessment for Flye Chr 22 (5 Mb)

In [16]:
# imports
# Biopython imports
from Bio.Seq import Seq
from Bio.SeqRecord import SeqRecord
from Bio.Alphabet import DNAAlphabet
from Bio import SeqIO

In [1]:
# Evaluate the five Flye contigs of the chr22 sample against the chr22_5mb
# reference: merge the contigs into one file, run QUAST on it, then align it
# to the reference with minimap2.
project_name = "chr22"
reference_genome = "/media/anuradhawick/data/Experiments/Assembly_Graph/Assembly/Sample_Genomes/chr22_5mb.fa"

# Start from a clean project directory: delete a previous run if present, then
# recreate the directory and its contigs/, mappings/ and quast_eval/ sub-folders.
![ -e "$project_name" ] && rm -r "$project_name"
!mkdir "$project_name"
![ ! -e "$project_name"/contigs ] && mkdir "$project_name"/contigs
![ ! -e "$project_name"/mappings ] && mkdir "$project_name"/mappings
![ ! -e "$project_name"/quast_eval ] && mkdir "$project_name"/quast_eval

# Concatenate contig_1 .. contig_5 into a single contigs.fasta inside the project.
!cat \
'../Improving_Assembly_Graph/chr22/contigs/contig_1' \
'../Improving_Assembly_Graph/chr22/contigs/contig_2' \
'../Improving_Assembly_Graph/chr22/contigs/contig_3' \
'../Improving_Assembly_Graph/chr22/contigs/contig_4' \
'../Improving_Assembly_Graph/chr22/contigs/contig_5' \
> ./"$project_name"/contigs/contigs.fasta 

# QUAST: report goes to quast_eval/ (-o), evaluated against the reference (-r),
# requesting 16 threads (-t) and ambiguity mode "all" (-a).
!quast.py -a all -o ./"$project_name"/quast_eval/ -r "$reference_genome" -t 16 ./"$project_name"/contigs/contigs.fasta

# Align the merged contigs to the reference; the output is redirected to a SAM file.
!minimap2 -a "$reference_genome" ./"$project_name"/contigs/contigs.fasta > ./"$project_name"/mappings/FLYE_alignment.sam
# Sorting and indexing of the alignment are currently disabled:
# !samtools sort ./"$project_name"/mappings/FLYE_alignment.sam > ./"$project_name"/mappings/FLYE_alignment.sorted.bam
# !samtools index -b ./"$project_name"/mappings/FLYE_alignment.sorted.bam

/home/anuradhawick/anaconda3/lib/python3.6/site-packages/quast-5.0.2-py3.6.egg/EGG-INFO/scripts/quast.py -a all -o ./chr22/quast_eval/ -r /media/anuradhawick/data/Experiments/Assembly_Graph/Assembly/Sample_Genomes/chr22_5mb.fa -t 16 ./chr22/contigs/contigs.fasta

Version: 5.0.2

System information:
  OS: Linux-4.15.0-43-generic-x86_64-with-debian-buster-sid (linux_64)
  Python version: 3.6.5
  CPUs number: 8

Started: 2019-01-02 09:42:55

Logging to /media/anuradhawick/data/Experiments/Assembly_Graph/Estimating_actual_contig_locations/chr22/quast_eval/quast.log

CWD: /media/anuradhawick/data/Experiments/Assembly_Graph/Estimating_actual_contig_locations
Main parameters: 
  MODE: default, threads: 16, minimum contig length: 500, minimum alignment length: 65, \
  ambiguity: all, threshold for extensive misassembly size: 1000

Reference:
  /media/anuradhawick/data/Experiments/Assembly_Graph/Assembly/Sample_Genomes/chr22_5mb.fa ==> chr22_5mb

Contigs:
  Pre-processing...
  ./chr22/contigs/c

In [33]:
# chunk and align

# obtain all contigs to one file
project_name = "chr22_chunk_align"
reference_genome = "/media/anuradhawick/data/Experiments/Assembly_Graph/Assembly/Sample_Genomes/chr22_5mb.fa"

![ -e "$project_name" ] && rm -r "$project_name"
!mkdir "$project_name"
!mkdir "$project_name/chunks"

chunks = []
with open(reference_genome, 'r') as f:
    content = f.read().strip().split('\n')
    content.pop(0)
    
    string = "".join(content)
    index = 0
    
    while index < len(string):
        chunks.append(string[index:index+10000].upper())
        index += 5000

chunk_index = 0
records = []
for c in chunks:
    r = SeqRecord(Seq(c, DNAAlphabet), id="Chunk_"+str(chunk_index), description="Generated Chunk" + str(chunk_index) + "-" + str(chunk_index + 10000))
    SeqIO.write(r, project_name+"/chunks/"+str(chunk_index) + ".fa", "fasta")
    chunk_index += 5000
    records.append(r)

SeqIO.write(records, project_name+"/chunks/all.fa", "fasta")

![ ! -e "$project_name"/contigs ] && mkdir "$project_name"/contigs
![ ! -e "$project_name"/mappings ] && mkdir "$project_name"/mappings
![ ! -e "$project_name"/quast_eval ] && mkdir "$project_name"/quast_eval

!cat \
'../Improving_Assembly_Graph/chr22/contigs/contig_1' \
'../Improving_Assembly_Graph/chr22/contigs/contig_2' \
'../Improving_Assembly_Graph/chr22/contigs/contig_3' \
'../Improving_Assembly_Graph/chr22/contigs/contig_4' \
'../Improving_Assembly_Graph/chr22/contigs/contig_5' \
> ./"$project_name"/contigs/contigs.fasta 

# !quast.py -a all -o ./"$project_name"/quast_eval/ -r "$reference_genome" -t 16 ./"$project_name"/contigs/contigs.fasta

!minimap2 -a "$project_name"/chunks/all.fa ./"$project_name"/contigs/contigs.fasta > ./"$project_name"/mappings/FLYE_alignment.sam
# # !samtools sort ./"$project_name"/mappings/FLYE_alignment.sam > ./"$project_name"/mappings/FLYE_alignment.sorted.bam
# # !samtools index -b ./"$project_name"/mappings/FLYE_alignment.sorted.bam

[M::mm_idx_gen::0.303*1.00] collected minimizers
[M::mm_idx_gen::0.392*1.37] sorted minimizers
[M::main::0.392*1.37] loaded/built the index for 1000 target sequence(s)
[M::mm_mapopt_update::0.408*1.36] mid_occ = 206
[M::mm_idx_stat] kmer size: 15; skip: 10; is_hpc: 0; #seq: 1000
[M::mm_idx_stat::0.418*1.35] distinct minimizers: 799170 (0.43% are singletons); average occurrences: 2.359; average spacing: 5.302
[M::worker_pipeline::12.922*1.05] mapped 5 sequences
[M::main] Version: 2.14-r886-dirty
[M::main] CMD: minimap2 -a chr22_chunk_align/chunks/all.fa ./chr22_chunk_align/contigs/contigs.fasta
[M::main] Real time: 12.928 sec; CPU: 13.638 sec; Peak RSS: 0.305 GB


# QUAST Assessment for Canu Chr 22 (5 Mb)

In [15]:
# Evaluate the Canu assembly of the chr22 sample against the chr22_5mb
# reference. The Canu contigs file is used directly (nothing is concatenated),
# so only mappings/ and quast_eval/ are created.
project_name = "chr22canu"
reference_genome = "/media/anuradhawick/data/Experiments/Assembly_Graph/Assembly/Sample_Genomes/chr22_5mb.fa"


# Start from a clean project directory.
![ -e "$project_name" ] && rm -r "$project_name"
!mkdir "$project_name"
![ ! -e "$project_name"/mappings ] && mkdir "$project_name"/mappings
![ ! -e "$project_name"/quast_eval ] && mkdir "$project_name"/quast_eval 

# QUAST: report goes to quast_eval/ (-o), evaluated against the reference (-r).
# The contigs path contains a space ("Out Chr22"), hence the quoting.
!quast.py -a all -o ./"$project_name"/quast_eval/ -r "$reference_genome" -t 16 "/media/anuradhawick/data/Experiments/Assembly_Graph/Assembly/Canu/Out Chr22/r1.contigs.fasta"

# Align the Canu contigs to the reference, then sort the alignment and index
# the sorted file.
!minimap2 -a "$reference_genome" "/media/anuradhawick/data/Experiments/Assembly_Graph/Assembly/Canu/Out Chr22/r1.contigs.fasta" > ./"$project_name"/mappings/CANU_alignment.sam
!samtools sort ./"$project_name"/mappings/CANU_alignment.sam > ./"$project_name"/mappings/CANU_alignment.sorted.bam
!samtools index -b ./"$project_name"/mappings/CANU_alignment.sorted.bam

/home/anuradhawick/anaconda3/lib/python3.6/site-packages/quast-5.0.2-py3.6.egg/EGG-INFO/scripts/quast.py -a all -o ./chr22canu/quast_eval/ -r /media/anuradhawick/data/Experiments/Assembly_Graph/Assembly/Sample_Genomes/chr22_5mb.fa -t 16 /media/anuradhawick/data/Experiments/Assembly_Graph/Assembly/Canu/Out Chr22/r1.contigs.fasta

Version: 5.0.2

System information:
  OS: Linux-4.15.0-42-generic-x86_64-with-debian-buster-sid (linux_64)
  Python version: 3.6.5
  CPUs number: 8

Started: 2018-12-20 14:00:14

Logging to /media/anuradhawick/data/Experiments/Assembly_Graph/Estimating_actual_contig_locations/chr22canu/quast_eval/quast.log

CWD: /media/anuradhawick/data/Experiments/Assembly_Graph/Estimating_actual_contig_locations
Main parameters: 
  MODE: default, threads: 16, minimum contig length: 500, minimum alignment length: 65, \
  ambiguity: all, threshold for extensive misassembly size: 1000

Reference:
  /media/anuradhawick/data/Experiments/Assembly_Graph/Assembly/Sample_Genomes/chr22

In [14]:
# Evaluate the three simG4 contigs against the G4 reference: merge the contigs
# into one file, run QUAST on it, then align it to the reference with minimap2.
project_name = "r4"
reference_genome = "/media/anuradhawick/data/Experiments/Assembly_Graph/Assembly/Sample_Genomes/G4.fa"

# Start from a clean project directory. quast_eval/ is not created here; it is
# only passed to QUAST as its output location (-o) below.
![ -e "$project_name" ] && rm -r "$project_name"
!mkdir "$project_name"
![ ! -e "$project_name"/contigs ] && mkdir "$project_name"/contigs
![ ! -e "$project_name"/mappings ] && mkdir "$project_name"/mappings

# Concatenate contig_1 .. contig_3 into a single contigs.fasta inside the project.
!cat \
'/media/anuradhawick/data/Experiments/Assembly_Graph/Improving_Assembly_Graph/simG4/contigs/contig_1' \
'/media/anuradhawick/data/Experiments/Assembly_Graph/Improving_Assembly_Graph/simG4/contigs/contig_2' \
'/media/anuradhawick/data/Experiments/Assembly_Graph/Improving_Assembly_Graph/simG4/contigs/contig_3' \
> ./"$project_name"/contigs/contigs.fasta 


# QUAST evaluation of the merged contigs against the reference (-r).
!quast.py -a all -o ./"$project_name"/quast_eval/ -r "$reference_genome" -t 16 ./"$project_name"/contigs/contigs.fasta

# Align the merged contigs to the reference; the output is redirected to a SAM file.
!minimap2 -a "$reference_genome" ./"$project_name"/contigs/contigs.fasta > ./"$project_name"/mappings/FLYE_alignment.sam
# Sorting and indexing of the alignment are currently disabled:
# !samtools sort ./"$project_name"/mappings/FLYE_alignment.sam > ./"$project_name"/mappings/FLYE_alignment.sorted.bam
# !samtools index -b ./"$project_name"/mappings/FLYE_alignment.sorted.bam

/home/anuradhawick/anaconda3/lib/python3.6/site-packages/quast-5.0.2-py3.6.egg/EGG-INFO/scripts/quast.py -a all -o ./r4/quast_eval/ -r /media/anuradhawick/data/Experiments/Assembly_Graph/Assembly/Sample_Genomes/G4.fa -t 16 ./r4/contigs/contigs.fasta

Version: 5.0.2

System information:
  OS: Linux-4.15.0-42-generic-x86_64-with-debian-buster-sid (linux_64)
  Python version: 3.6.5
  CPUs number: 8

Started: 2018-12-20 13:59:31

Logging to /media/anuradhawick/data/Experiments/Assembly_Graph/Estimating_actual_contig_locations/r4/quast_eval/quast.log

CWD: /media/anuradhawick/data/Experiments/Assembly_Graph/Estimating_actual_contig_locations
Main parameters: 
  MODE: default, threads: 16, minimum contig length: 500, minimum alignment length: 65, \
  ambiguity: all, threshold for extensive misassembly size: 1000

Reference:
  /media/anuradhawick/data/Experiments/Assembly_Graph/Assembly/Sample_Genomes/G4.fa ==> G4

Contigs:
  Pre-processing...
  ./r4/contigs/contigs.fasta ==> contigs

2018-12

In [3]:
project_name = "chr22_contig5"
reference_genome = "/media/anuradhawick/data/Experiments/Assembly_Graph/Assembly/Sample_Genomes/chr22_5mb.fa"
 

![ -e "$project_name" ] && rm -r "$project_name"
!mkdir "$project_name"
![ ! -e "$project_name"/contigs ] && mkdir "$project_name"/contigs
![ ! -e "$project_name"/mappings ] && mkdir "$project_name"/mappings
![ ! -e "$project_name"/quast_eval ] && mkdir "$project_name"/quast_eval

!cat \
'../Improving_Assembly_Graph/chr22/contigs/contig_4' \
> ./"$project_name"/contigs/contigs.fasta 

!quast.py -a all --ambiguity-score 0.8 -o ./"$project_name"/quast_eval/ -r "$reference_genome" -t 16 "../Improving_Assembly_Graph/chr22/contigs/contig_5"

# !minimap2 -a "$reference_genome" ./"$project_name"/contigs/contigs.fasta > ./"$project_name"/mappings/FLYE_alignment.sam
# !samtools sort ./"$project_name"/mappings/FLYE_alignment.sam > ./"$project_name"/mappings/FLYE_alignment.sorted.bam
# !samtools index -b ./"$project_name"/mappings/FLYE_alignment.sorted.bam

/home/anuradhawick/anaconda3/lib/python3.6/site-packages/quast-5.0.2-py3.6.egg/EGG-INFO/scripts/quast.py -a all --ambiguity-score 0.8 -o ./chr22_contig5/quast_eval/ -r /media/anuradhawick/data/Experiments/Assembly_Graph/Assembly/Sample_Genomes/chr22_5mb.fa -t 16 ../Improving_Assembly_Graph/chr22/contigs/contig_5

Version: 5.0.2

System information:
  OS: Linux-4.15.0-43-generic-x86_64-with-debian-buster-sid (linux_64)
  Python version: 3.6.5
  CPUs number: 8

Started: 2019-01-02 09:47:03

Logging to /media/anuradhawick/data/Experiments/Assembly_Graph/Estimating_actual_contig_locations/chr22_contig5/quast_eval/quast.log

CWD: /media/anuradhawick/data/Experiments/Assembly_Graph/Estimating_actual_contig_locations
Main parameters: 
  MODE: default, threads: 16, minimum contig length: 500, minimum alignment length: 65, \
  ambiguity: all, threshold for extensive misassembly size: 1000

Reference:
  /media/anuradhawick/data/Experiments/Assembly_Graph/Assembly/Sample_Genomes/chr22_5mb.fa ==> 

In [6]:
# Evaluate Flye contig_4 of the chr22 sample on its own against the chr22_5mb
# reference.
project_name = "chr22_contig4"
reference_genome = "/media/anuradhawick/data/Experiments/Assembly_Graph/Assembly/Sample_Genomes/chr22_5mb.fa"
 

# Start from a clean project directory with contigs/, mappings/ and quast_eval/.
![ -e "$project_name" ] && rm -r "$project_name"
!mkdir "$project_name"
![ ! -e "$project_name"/contigs ] && mkdir "$project_name"/contigs
![ ! -e "$project_name"/mappings ] && mkdir "$project_name"/mappings
![ ! -e "$project_name"/quast_eval ] && mkdir "$project_name"/quast_eval

# Copy contig_4 into the project as contigs.fasta.
!cat \
'../Improving_Assembly_Graph/chr22/contigs/contig_4' \
> ./"$project_name"/contigs/contigs.fasta 

# QUAST on the staged contig with --ambiguity-score 0.8; report goes to quast_eval/ (-o).
!quast.py -a all --ambiguity-score 0.8 -o ./"$project_name"/quast_eval/ -r "$reference_genome" -t 16 ./"$project_name"/contigs/contigs.fasta

# Alignment, sorting and indexing are currently disabled:
# !minimap2 -a "$reference_genome" ./"$project_name"/contigs/contigs.fasta > ./"$project_name"/mappings/FLYE_alignment.sam
# !samtools sort ./"$project_name"/mappings/FLYE_alignment.sam > ./"$project_name"/mappings/FLYE_alignment.sorted.bam
# !samtools index -b ./"$project_name"/mappings/FLYE_alignment.sorted.bam

/home/anuradhawick/anaconda3/lib/python3.6/site-packages/quast-5.0.2-py3.6.egg/EGG-INFO/scripts/quast.py -a all --ambiguity-score 0.8 -o ./chr22_contig4/quast_eval/ -r /media/anuradhawick/data/Experiments/Assembly_Graph/Assembly/Sample_Genomes/chr22_5mb.fa -t 16 ./chr22_contig4/contigs/contigs.fasta

Version: 5.0.2

System information:
  OS: Linux-4.15.0-43-generic-x86_64-with-debian-buster-sid (linux_64)
  Python version: 3.6.5
  CPUs number: 8

Started: 2019-01-02 09:49:53

Logging to /media/anuradhawick/data/Experiments/Assembly_Graph/Estimating_actual_contig_locations/chr22_contig4/quast_eval/quast.log

CWD: /media/anuradhawick/data/Experiments/Assembly_Graph/Estimating_actual_contig_locations
Main parameters: 
  MODE: default, threads: 16, minimum contig length: 500, minimum alignment length: 65, \
  ambiguity: all, threshold for extensive misassembly size: 1000

Reference:
  /media/anuradhawick/data/Experiments/Assembly_Graph/Assembly/Sample_Genomes/chr22_5mb.fa ==> chr22_5mb

Co

In [8]:
# Compare two Flye contigs with each other: contig_2 plays the role of the
# reference and contig_4 is evaluated and aligned against it.
project_name = "chr22_contig4to2"
reference_genome = '../Improving_Assembly_Graph/chr22/contigs/contig_2'
 

# Start from a clean project directory with contigs/, mappings/ and quast_eval/.
![ -e "$project_name" ] && rm -r "$project_name"
!mkdir "$project_name"
![ ! -e "$project_name"/contigs ] && mkdir "$project_name"/contigs
![ ! -e "$project_name"/mappings ] && mkdir "$project_name"/mappings
![ ! -e "$project_name"/quast_eval ] && mkdir "$project_name"/quast_eval

# Copy contig_4 into the project as contigs.fasta.
!cat \
'../Improving_Assembly_Graph/chr22/contigs/contig_4' \
> ./"$project_name"/contigs/contigs.fasta 

# QUAST on contig_4 with contig_2 as reference (-r); report goes to quast_eval/ (-o).
!quast.py -a all --ambiguity-score 0.8 -o ./"$project_name"/quast_eval/ -r "$reference_genome" -t 16 ./"$project_name"/contigs/contigs.fasta

# Align contig_4 to contig_2; the output is redirected to a SAM file.
!minimap2 -a "$reference_genome" ./"$project_name"/contigs/contigs.fasta > ./"$project_name"/mappings/FLYE_alignment.sam
# Sorting and indexing of the alignment are currently disabled:
# !samtools sort ./"$project_name"/mappings/FLYE_alignment.sam > ./"$project_name"/mappings/FLYE_alignment.sorted.bam
# !samtools index -b ./"$project_name"/mappings/FLYE_alignment.sorted.bam

/home/anuradhawick/anaconda3/lib/python3.6/site-packages/quast-5.0.2-py3.6.egg/EGG-INFO/scripts/quast.py -a all --ambiguity-score 0.8 -o ./chr22_contig4to2/quast_eval/ -r ../Improving_Assembly_Graph/chr22/contigs/contig_2 -t 16 ./chr22_contig4to2/contigs/contigs.fasta

Version: 5.0.2

System information:
  OS: Linux-4.15.0-43-generic-x86_64-with-debian-buster-sid (linux_64)
  Python version: 3.6.5
  CPUs number: 8

Started: 2019-01-02 09:53:01

Logging to /media/anuradhawick/data/Experiments/Assembly_Graph/Estimating_actual_contig_locations/chr22_contig4to2/quast_eval/quast.log

CWD: /media/anuradhawick/data/Experiments/Assembly_Graph/Estimating_actual_contig_locations
Main parameters: 
  MODE: default, threads: 16, minimum contig length: 500, minimum alignment length: 65, \
  ambiguity: all, threshold for extensive misassembly size: 1000

Reference:
  /media/anuradhawick/data/Experiments/Assembly_Graph/Improving_Assembly_Graph/chr22/contigs/contig_2 ==> contig_2

Contigs:
  Pre-proces

In [10]:
# Compare Flye contigs with a Canu contig: canutig22.fasta plays the role of the
# reference and flye2_4_5.fasta is evaluated and aligned against it.
project_name = "chr22_flye_to_canu"
reference_genome = "/media/anuradhawick/data/Experiments/Assembly_Graph/Estimating_actual_contig_locations/canu_contigs_chr22/canutig22.fasta"
 

# Start from a clean project directory. contigs/ is created but nothing in this
# cell writes to it; both tools read flye2_4_5.fasta from its original location.
![ -e "$project_name" ] && rm -r "$project_name"
!mkdir "$project_name"
![ ! -e "$project_name"/contigs ] && mkdir "$project_name"/contigs
![ ! -e "$project_name"/mappings ] && mkdir "$project_name"/mappings
![ ! -e "$project_name"/quast_eval ] && mkdir "$project_name"/quast_eval


# QUAST report goes to quast_eval/ (-o); the minimap2 output is redirected to
# mappings/alignment.sam.
!quast.py -a all --ambiguity-score 0.8 -o ./"$project_name"/quast_eval/ -r "$reference_genome" -t 16 "/media/anuradhawick/data/Experiments/Assembly_Graph/Estimating_actual_contig_locations/canu_contigs_chr22/flye2_4_5.fasta"
!minimap2 -a "$reference_genome" "/media/anuradhawick/data/Experiments/Assembly_Graph/Estimating_actual_contig_locations/canu_contigs_chr22/flye2_4_5.fasta" > ./"$project_name"/mappings/alignment.sam
# Sorting and indexing are currently disabled. The file names below follow the
# alignment.sam written above (they used to name FLYE_alignment.sam, which this
# cell never creates).
# !samtools sort ./"$project_name"/mappings/alignment.sam > ./"$project_name"/mappings/alignment.sorted.bam
# !samtools index -b ./"$project_name"/mappings/alignment.sorted.bam

/home/anuradhawick/anaconda3/lib/python3.6/site-packages/quast-5.0.2-py3.6.egg/EGG-INFO/scripts/quast.py -a all --ambiguity-score 0.8 -o ./chr22_flye_to_canu/quast_eval/ -r /media/anuradhawick/data/Experiments/Assembly_Graph/Estimating_actual_contig_locations/canu_contigs_chr22/canutig22.fasta -t 16 /media/anuradhawick/data/Experiments/Assembly_Graph/Estimating_actual_contig_locations/canu_contigs_chr22/flye2_4_5.fasta

Version: 5.0.2

System information:
  OS: Linux-4.15.0-43-generic-x86_64-with-debian-buster-sid (linux_64)
  Python version: 3.6.5
  CPUs number: 8

Started: 2019-01-03 16:10:53

Logging to /media/anuradhawick/data/Experiments/Assembly_Graph/Estimating_actual_contig_locations/chr22_flye_to_canu/quast_eval/quast.log

CWD: /media/anuradhawick/data/Experiments/Assembly_Graph/Estimating_actual_contig_locations
Main parameters: 
  MODE: default, threads: 16, minimum contig length: 500, minimum alignment length: 65, \
  ambiguity: all, threshold for extensive misassembly size

# Yeast Genome Contig Realignment

In [14]:
# Evaluate all 18 Flye contigs of the yeast sample against the yeast reference:
# merge the contigs into one file, run QUAST on it, then align it to the
# reference with minimap2.
project_name = "yeastgenome"
reference_genome = "/media/anuradhawick/data/Experiments/Assembly_Graph/Assembly/Sample_Genomes/yeast/YeastGenome.fa"

# Start from a clean project directory with contigs/, mappings/ and quast_eval/.
![ -e "$project_name" ] && rm -r "$project_name"
!mkdir "$project_name"
![ ! -e "$project_name"/contigs ] && mkdir "$project_name"/contigs
![ ! -e "$project_name"/mappings ] && mkdir "$project_name"/mappings
![ ! -e "$project_name"/quast_eval ] && mkdir "$project_name"/quast_eval

# Concatenate contig_1 .. contig_18 into a single contigs.fasta inside the project.
!cat \
'../Improving_Assembly_Graph/yeast/contigs/contig_1' \
'../Improving_Assembly_Graph/yeast/contigs/contig_2' \
'../Improving_Assembly_Graph/yeast/contigs/contig_3' \
'../Improving_Assembly_Graph/yeast/contigs/contig_4' \
'../Improving_Assembly_Graph/yeast/contigs/contig_5' \
'../Improving_Assembly_Graph/yeast/contigs/contig_6' \
'../Improving_Assembly_Graph/yeast/contigs/contig_7' \
'../Improving_Assembly_Graph/yeast/contigs/contig_8' \
'../Improving_Assembly_Graph/yeast/contigs/contig_9' \
'../Improving_Assembly_Graph/yeast/contigs/contig_10' \
'../Improving_Assembly_Graph/yeast/contigs/contig_11' \
'../Improving_Assembly_Graph/yeast/contigs/contig_12' \
'../Improving_Assembly_Graph/yeast/contigs/contig_13' \
'../Improving_Assembly_Graph/yeast/contigs/contig_14' \
'../Improving_Assembly_Graph/yeast/contigs/contig_15' \
'../Improving_Assembly_Graph/yeast/contigs/contig_16' \
'../Improving_Assembly_Graph/yeast/contigs/contig_17' \
'../Improving_Assembly_Graph/yeast/contigs/contig_18' \
> ./"$project_name"/contigs/contigs.fasta 

# QUAST on the merged contigs with --ambiguity-score 0.8; report goes to quast_eval/ (-o).
!quast.py -a all --ambiguity-score 0.8 -o ./"$project_name"/quast_eval/ -r "$reference_genome" -t 16 ./"$project_name"/contigs/contigs.fasta

# Align the merged contigs to the reference; the output is redirected to a SAM file.
!minimap2 -a "$reference_genome" ./"$project_name"/contigs/contigs.fasta > ./"$project_name"/mappings/FLYE_alignment.sam
# Sorting and indexing of the alignment are currently disabled:
# !samtools sort ./"$project_name"/mappings/FLYE_alignment.sam > ./"$project_name"/mappings/FLYE_alignment.sorted.bam
# !samtools index -b ./"$project_name"/mappings/FLYE_alignment.sorted.bam

/home/anuradhawick/anaconda3/lib/python3.6/site-packages/quast-5.0.2-py3.6.egg/EGG-INFO/scripts/quast.py -a all --ambiguity-score 0.8 -o ./yeastgenome/quast_eval/ -r /media/anuradhawick/data/Experiments/Assembly_Graph/Assembly/Sample_Genomes/yeast/YeastGenome.fa -t 16 ./yeastgenome/contigs/contigs.fasta

Version: 5.0.2

System information:
  OS: Linux-4.15.0-43-generic-x86_64-with-debian-buster-sid (linux_64)
  Python version: 3.6.5
  CPUs number: 8

Started: 2019-01-04 13:35:20

Logging to /media/anuradhawick/data/Experiments/Assembly_Graph/Estimating_actual_contig_locations/yeastgenome/quast_eval/quast.log

CWD: /media/anuradhawick/data/Experiments/Assembly_Graph/Estimating_actual_contig_locations
Main parameters: 
  MODE: default, threads: 16, minimum contig length: 500, minimum alignment length: 65, \
  ambiguity: all, threshold for extensive misassembly size: 1000

Reference:
  /media/anuradhawick/data/Experiments/Assembly_Graph/Assembly/Sample_Genomes/yeast/YeastGenome.fa ==> Yea

In [15]:
# Same evaluation as the full yeast run, but restricted to a subset of the
# contigs (contig_1 .. contig_6 and contig_15).
project_name = "yeastgenome_refinedgraph"
reference_genome = "/media/anuradhawick/data/Experiments/Assembly_Graph/Assembly/Sample_Genomes/yeast/YeastGenome.fa"

# Start from a clean project directory with contigs/, mappings/ and quast_eval/.
![ -e "$project_name" ] && rm -r "$project_name"
!mkdir "$project_name"
![ ! -e "$project_name"/contigs ] && mkdir "$project_name"/contigs
![ ! -e "$project_name"/mappings ] && mkdir "$project_name"/mappings
![ ! -e "$project_name"/quast_eval ] && mkdir "$project_name"/quast_eval

# Concatenate the selected contigs into a single contigs.fasta inside the project.
!cat \
'../Improving_Assembly_Graph/yeast/contigs/contig_1' \
'../Improving_Assembly_Graph/yeast/contigs/contig_2' \
'../Improving_Assembly_Graph/yeast/contigs/contig_3' \
'../Improving_Assembly_Graph/yeast/contigs/contig_4' \
'../Improving_Assembly_Graph/yeast/contigs/contig_5' \
'../Improving_Assembly_Graph/yeast/contigs/contig_6' \
'../Improving_Assembly_Graph/yeast/contigs/contig_15' \
> ./"$project_name"/contigs/contigs.fasta 

# QUAST on the merged contigs with --ambiguity-score 0.8; report goes to quast_eval/ (-o).
!quast.py -a all --ambiguity-score 0.8 -o ./"$project_name"/quast_eval/ -r "$reference_genome" -t 16 ./"$project_name"/contigs/contigs.fasta

# Align the merged contigs to the reference; the output is redirected to a SAM file.
!minimap2 -a "$reference_genome" ./"$project_name"/contigs/contigs.fasta > ./"$project_name"/mappings/FLYE_alignment.sam
# Sorting and indexing of the alignment are currently disabled:
# !samtools sort ./"$project_name"/mappings/FLYE_alignment.sam > ./"$project_name"/mappings/FLYE_alignment.sorted.bam
# !samtools index -b ./"$project_name"/mappings/FLYE_alignment.sorted.bam

/home/anuradhawick/anaconda3/lib/python3.6/site-packages/quast-5.0.2-py3.6.egg/EGG-INFO/scripts/quast.py -a all --ambiguity-score 0.8 -o ./yeastgenome_refinedgraph/quast_eval/ -r /media/anuradhawick/data/Experiments/Assembly_Graph/Assembly/Sample_Genomes/yeast/YeastGenome.fa -t 16 ./yeastgenome_refinedgraph/contigs/contigs.fasta

Version: 5.0.2

System information:
  OS: Linux-4.15.0-43-generic-x86_64-with-debian-buster-sid (linux_64)
  Python version: 3.6.5
  CPUs number: 8

Started: 2019-01-04 13:35:43

Logging to /media/anuradhawick/data/Experiments/Assembly_Graph/Estimating_actual_contig_locations/yeastgenome_refinedgraph/quast_eval/quast.log

CWD: /media/anuradhawick/data/Experiments/Assembly_Graph/Estimating_actual_contig_locations
Main parameters: 
  MODE: default, threads: 16, minimum contig length: 500, minimum alignment length: 65, \
  ambiguity: all, threshold for extensive misassembly size: 1000

Reference:
  /media/anuradhawick/data/Experiments/Assembly_Graph/Assembly/Samp

In [34]:
# Evaluate the Canu assembly of the yeast sample against the yeast reference.
# The Canu contigs file is used directly (nothing is concatenated), so only
# mappings/ and quast_eval/ are created.
project_name = "yeastcanu"
reference_genome = "/media/anuradhawick/data/Experiments/Assembly_Graph/Assembly/Sample_Genomes/yeast/YeastGenome.fa"


# Start from a clean project directory.
![ -e "$project_name" ] && rm -r "$project_name"
!mkdir "$project_name"
![ ! -e "$project_name"/mappings ] && mkdir "$project_name"/mappings
![ ! -e "$project_name"/quast_eval ] && mkdir "$project_name"/quast_eval 

# QUAST: report goes to quast_eval/ (-o), evaluated against the reference (-r).
# The contigs path contains a space ("Out Yeast"), hence the quoting.
!quast.py -a all -o ./"$project_name"/quast_eval/ -r "$reference_genome" -t 16 "/media/anuradhawick/data/Experiments/Assembly_Graph/Assembly/Canu/Out Yeast/r1.contigs.fasta"

# Alignment of the Canu contigs to the reference is currently disabled:
# !minimap2 -a "$reference_genome" "/media/anuradhawick/data/Experiments/Assembly_Graph/Assembly/Canu/Out Yeast/r1.contigs.fasta" > ./"$project_name"/mappings/CANU_alignment.sam

/home/anuradhawick/anaconda3/lib/python3.6/site-packages/quast-5.0.2-py3.6.egg/EGG-INFO/scripts/quast.py -a all -o ./yeastcanu/quast_eval/ -r /media/anuradhawick/data/Experiments/Assembly_Graph/Assembly/Sample_Genomes/yeast/YeastGenome.fa -t 16 /media/anuradhawick/data/Experiments/Assembly_Graph/Assembly/Canu/Out Yeast/r1.contigs.fasta

Version: 5.0.2

System information:
  OS: Linux-4.15.0-43-generic-x86_64-with-debian-buster-sid (linux_64)
  Python version: 3.6.5
  CPUs number: 8

Started: 2019-01-04 16:44:53

Logging to /media/anuradhawick/data/Experiments/Assembly_Graph/Estimating_actual_contig_locations/yeastcanu/quast_eval/quast.log

CWD: /media/anuradhawick/data/Experiments/Assembly_Graph/Estimating_actual_contig_locations
Main parameters: 
  MODE: default, threads: 16, minimum contig length: 500, minimum alignment length: 65, \
  ambiguity: all, threshold for extensive misassembly size: 1000

Reference:
  /media/anuradhawick/data/Experiments/Assembly_Graph/Assembly/Sample_Genom