In [1]:
import json
from cosap import Pipeline, FastqReader, Mapper, VariantCaller, version, PipelineRunner, MDUP,Recalibrator
from cosap import VarScanVariantCaller
import yaml
version

'0.0.1'

In [2]:
germline_files = [
    FastqReader("/media/mae/SeagateExpansionDrive/arif/case_1_germline_wes/SRR3182423_1.fastq.gz", platform="illumina", read=1),
    FastqReader("/media/mae/SeagateExpansionDrive/arif/case_1_germline_wes/SRR3182423_1.fastq.gz", platform="illumina", read=2)
]

tumor_files = [
    FastqReader("/media/mae/SeagateExpansionDrive/arif/case_1_biorep_a_wes/SRR3182433_1.fastq.gz", platform="illumina", read=1),
    FastqReader("/media/mae/SeagateExpansionDrive/arif/case_1_biorep_a_wes/SRR3182433_2.fastq.gz", platform="illumina", read=2)
]

In [3]:
mapper_germline = Mapper(library="bwa", reads=germline_files, params={
    "read_groups": {
        "ID": "Pt28N",
        "SM": "Pt28N",
        "PU": "0",
        "PL": "illumina",
        "LB": "Pt28N"
    }
})
mapper_tumor = Mapper(library="bwa", reads=tumor_files, params={
    "read_groups": {
        "ID": "S13",
        "SM": "S13",
        "PU": "0",
        "PL": "illumina",
        "LB": "S13"
    }
})

In [4]:
mdup_germline = MDUP(input_step=mapper_germline)
mdup_tumor = MDUP(input_step=mapper_tumor)

In [5]:
base_racalibrator_germline = Recalibrator(input_step=mdup_germline)
base_racalibrator_tumor = Recalibrator(input_step=mdup_tumor)

In [6]:
caller1 = VariantCaller(library="mutect", germline=base_racalibrator_germline, tumor=base_racalibrator_tumor, params={})
caller2 = VariantCaller(library="varscan", germline=base_racalibrator_germline, tumor=base_racalibrator_tumor, params={})

In [7]:
pipeline = (
    Pipeline()
    .add(mapper_germline)
    .add(mapper_tumor)
    .add(mdup_germline)
    .add(mdup_tumor)
    .add(base_racalibrator_germline)
    .add(base_racalibrator_tumor)
    .add(caller1)
    .add(caller2)
)

In [8]:
pipeline_config = pipeline.build()

In [9]:
pipeline_config["workdir"] = "/media/mae/SeagateExpansionDrive/arif/pipeline_reproduce/"

In [10]:
pipeline_config

{'library_path': '/home/mae/Desktop/hg38_bundle',
 'creation-date': '2021-09-11 16:47:16',
 'version': '0.0.1',
 'mapping': {'9870': {'library': 'bwa',
   'input': {'1': '/media/mae/SeagateExpansionDrive/arif/case_1_germline_wes/SRR3182423_1.fastq.gz',
    '2': '/media/mae/SeagateExpansionDrive/arif/case_1_germline_wes/SRR3182423_1.fastq.gz'},
   'output': 'unprocessed_9870.bam',
   'params': {'read_groups': {'ID': 'Pt28N',
     'SM': 'Pt28N',
     'PU': '0',
     'PL': 'illumina',
     'LB': 'Pt28N'}}},
  '00B3': {'library': 'bwa',
   'input': {'1': '/media/mae/SeagateExpansionDrive/arif/case_1_biorep_a_wes/SRR3182433_1.fastq.gz',
    '2': '/media/mae/SeagateExpansionDrive/arif/case_1_biorep_a_wes/SRR3182433_2.fastq.gz'},
   'output': 'unprocessed_00B3.bam',
   'params': {'read_groups': {'ID': 'S13',
     'SM': 'S13',
     'PU': '0',
     'PL': 'illumina',
     'LB': 'S13'}}}},
 'sorting': {},
 'index': {},
 'merge': {},
 'mdup': {'9870': {'input': 'unprocessed_9870.bam', 'output': 'm

In [11]:
with open("/home/mae/Desktop/cosap/snakemake_workflows/config.yaml", "w") as config_yaml:
            yaml.dump(pipeline_config, config_yaml, default_flow_style=False)

In [None]:
runner = PipelineRunner()

In [None]:
runner.run_pipeline_snakemake(pipeline_config=pipeline_config,
                              output_dir = "/media/mae/SeagateExpansionDrive/arif/pipeline_reproduce/")