## Before starting: 
### 1. prepare the design spreadsheet corresponding to the experiment
### 2. create an empty folder for this NGS run
### 3. make a copy of this notebook inside the run folder
### 4. place .fastq.gz files in the "raw_reads" folder, under the run folder

In [None]:
%matplotlib inline

# >>>>>>>>>> INPUT >>>>>>>>>>

config = {
    # Library name prefixes, one per sequenced library.
    # Example: "SP5-0515_S53" corresponds to the read pair
    #   SP5-0515_S53_L001_R1_001.fastq.gz and SP5-0515_S53_L001_R2_001.fastq.gz
    "lib_list": [
        "SP5-0515_S53",
        "SP6-0515_S54",
        "US5-0515_S49",
        "US6-0515_S50",
        "WR3-0515_S51",
        "WR4-0515_S52",
    ],

    # Sequencing platform: "MiSeq" or anything else.
    "sequencer": "MiSeq",

    # Panel information.
    # Path to the design spreadsheet:
    "design_file_path": "../Olivar-multi preliminary design 102723-2 formated.xlsx",
    "panel_type": "legacy",  # default: "legacy"
    "total_tube": 1,  # number of tubes (primer pools)

    # FASTQ path templates; %s is the library name.
    # NOTE: the templates need to change if reads were merged from multiple lanes.
    "r1_path_format": "raw_reads/%s_L001_R1_001.fastq.gz",
    "r2_path_format": "raw_reads/%s_L001_R2_001.fastq.gz",

    # Output options.
    "verbose": True,  # print in the notebook
    "to_plot": False,  # show plots in the notebook
    "keep_sam": False,  # keep SAM files
    "save_raw_UMI": True,  # save the UMI grouping file

    # Performance level:
    #   1 -> less RAM and half of all logical cores
    #        (e.g. a laptop with hyperthreading)
    #   2 -> more RAM and all cores (e.g. AWS or a workstation)
    # NOTE(review): the key is spelled "performace_level"; it is a runtime key,
    # so it is left as-is -- confirm what QASeq expects before renaming it.
    "performace_level": 1,

    # Function block switches.
    # Bowtie2 index, homopolymer coordinates, primer head hash table:
    "BUILD_INDEX": True,
    # Adapter trimming and bowtie2 alignment (necessary for other function blocks):
    "TRIM_ALIGN_SWITCH": True,
    # UMI grouping, UMI voting and variant calling (needs BAM files):
    "UMI_SWITCH": True,
    # Uniformity analysis and plots (needs BAM files):
    "UNIFORMITY_SWITCH": True,
    # Dimer analysis and plots (needs dimer.fastq.gz):
    "DIMER_SWITCH": True,
    # Non-specific analysis and plots (needs BAM files):
    "NS_SWITCH": True,
}

# <<<<<<<<<< INPUT <<<<<<<<<<


# Import QASeq's entry point and call it with the config dict defined above.
# NOTE(review): which stages run is presumably controlled by BUILD_INDEX and
# the *_SWITCH flags in config -- confirm against the QASeq implementation.
from QASeq import analysis
analysis(config)