## Putting final touches on Crimson Glory genome assembly.

#### Goal: name each scaffold after its corresponding *Eucalyptus grandis* chromosome, and confirm that all scaffolds are in the correct order and orientation.

#### Reference: the most recent *E. grandis* genome assembly from the Australian National University (RefSeq GCF_016545825.1, ASM1654582v1), available here:
https://www.ncbi.nlm.nih.gov/datasets/genome/GCF_016545825.1/



In [14]:
## Set up
# Paths shared by the cells below.
# NOTE(review): "CrismsonGlory" is spelled exactly as the paths were given; presumably
# it matches the directory on disk -- do not "correct" it without checking.

# Working directory for this assembly (trailing slash kept, as originally defined).
WKDIR="/workspace/hraijc/Manuka/CrismsonGlory_V2/Genome_Assembly/"

# E. grandis reference assembly FASTA (GCF_016545825.1 / ASM1654582v1).
EG_ASSEMBLY="/workspace/ComparativeDataSources/Myrtaceae/Eucalyptus/grandis/Genome/ASM1654582v1/ncbi_dataset/data/GCF_016545825.1/GCF_016545825.1_ASM1654582v1_genomic.fna"

# Draft assembly FASTA, derived from WKDIR so the root path is written only once.
# ${WKDIR%/} strips the trailing slash, so the value equals the original literal.
DRAFT="${WKDIR%/}/manuka_CG_Hybrid_v2d_100kb.fasta"

In [15]:
# Create the SLURM log directory before any job is submitted: the sbatch
# -o/-e paths used in this notebook point at ${WKDIR}/log, and SLURM does not
# create missing output directories. mkdir -p is a no-op if it already exists.
mkdir -p "${WKDIR%/}/log"

# Run everything from the working directory so relative outputs land there.
cd "${WKDIR}"

In [3]:
# Whole-genome alignment between the draft assembly and the E. grandis reference.
#
# minimap2 takes <target> then <query>, so with the argument order below the
# draft is the target and E. grandis is the query (PAF column 1 = E. grandis
# sequence name, column 6 = draft scaffold name).
# NOTE(review): if the draft was meant to be the query, swap the two FASTA
# arguments -- confirm against whatever consumes the PAF.
#
# The heredoc is unquoted on purpose: ${WKDIR}, ${DRAFT} and ${EG_ASSEMBLY} are
# filled in at submission time, while backslash-escaped variables are left for
# the job itself to expand.

sbatch << EOF
#!/bin/bash
#SBATCH -J minimap
#SBATCH -o ${WKDIR}/log/%J.out
#SBATCH -e ${WKDIR}/log/%J.err
#SBATCH --cpus-per-task=4
#SBATCH --mem=2G
#SBATCH --time=01:10:00

module load minimap2

# Abort on the first failure so a failed alignment is never promoted below.
set -euo pipefail

PAF=ManukaV2d100kb_EgrandisASM1654582v1_asm10.paf

# Thread count follows --cpus-per-task instead of repeating the number.
# -x asm10: assembly-to-assembly preset; -c: include CIGAR in the PAF output.
# Write to a temporary name and rename only on success, so a job killed by the
# time or memory limit cannot leave a truncated file under the final name.
minimap2 -t "\${SLURM_CPUS_PER_TASK}" -cx asm10 "${DRAFT}" "${EG_ASSEMBLY}" > "\${PAF}.tmp"
mv "\${PAF}.tmp" "\${PAF}"
EOF

Submitted batch job 2009545


### AssemblyQC

In [16]:
# Move into the assembly_qc pipeline directory under the working directory.
# Quoted so the path survives word splitting; ${WKDIR%/} avoids a doubled slash.
cd "${WKDIR%/}/assembly_qc/"

In [17]:
# Print the pipeline configuration without its comment lines.
# Only lines that START with // (after optional indentation) are hidden, so
# settings that carry a trailing // comment, or whose value contains // (for
# example a URL), remain visible instead of silently disappearing.
grep -v '^[[:space:]]*//' nextflow.config

includeConfig './conf/base.config'

params {
    
    target_assemblies       = [
        ["manuka_CG_Hybrid_v2d_100kb", "/workspace/hraijc/Manuka/CrismsonGlory_V2/Genome_Assembly/manuka_CG_Hybrid_v2d_100kb.fasta"]
    ]

    assembly_gff3           = []
    
    assemblathon_stats {
        n_limit             = 100
    }

    ncbi_fcs_adaptor {


    }

    ncbi_fcs_gx {
        skip                = 1

        tax_id              = "78410"

        db_path             = "/workspace/ComparativeDataSources/NCBI/FCS/GX/r2023-01-24"

    }
    
    busco {
        skip                = 0

        mode                = "geno"
        
        lineage_datasets    = ["embryophyta_odb10"]

        download_path       = "/workspace/ComparativeDataSources/BUSCO/assembly_qc"
    }

    tidk {
        skip                = 0
        
        repeat_seq          = "TTTAGGG"

        filter_by_size      = 0

        filter_size_bp      = 1000000
    }

    lai {
        skip                = 0

 

In [18]:
# Submit the assembly_qc launcher script to SLURM from the current directory.
# NOTE(review): assembly_qc_pfr.sh is not shown in this notebook; presumably it
# runs the pipeline using the nextflow.config printed above -- confirm.
sbatch ./assembly_qc_pfr.sh

Submitted batch job 2009931
