# Local Mutation Reviewer Example

1. Install IGV here: https://software.broadinstitute.org/software/igv/download (tested on version 2.15)
1. BEFORE running the Mutation Reviewer:
    1. Open IGV
    1. Go to "Google" and log in
    1. Go to "Google" and enter google project id. This is required for requestor pays. If the mutations are loading but the bams are not, this is likely the problem.
1. Run the notebook

In [20]:
%load_ext autoreload
%autoreload 2

The autoreload extension is already loaded. To reload it, use:
  %reload_ext autoreload


In [21]:
import pandas as pd
import numpy as np
import os
from MutationReviewer.Reviewers.MutationReviewer import MutationReviewer
import dalmatian

In [22]:
data_dir = './data/'
if not os.path.isdir(data_dir):
    os.mkdir(data_dir)
    
notebook_data_dir = f'{data_dir}/local_mutation_reviewer_example/'
if not os.path.isdir(notebook_data_dir):
    os.mkdir(notebook_data_dir)

In [4]:
analysis_workspace = 'broad-getzlab-ibm-taml-t/Ebert-Sperling_MDS-AML-pran-4_Claudia_v1'
wm = dalmatian.WorkspaceManager(analysis_workspace)
sample_bams_df = wm.get_samples()

In [30]:
mutsig_annot_maf_fn = 'gs://fc-secure-c220c99a-d38d-4e44-ac3f-093f46579d69/submissions/57ae3382-beee-47af-a5fa-d6ce33c09cc9/mutation_mutsig2cv_hg19/92ba2984-bfd8-4e49-8f8e-644bd7cec874/call-tool_mutsig2cv_hg19/5_0002_Discovery-Participants.final_analysis_set.maf'
mutsig_annot_maf_df = pd.read_csv(mutsig_annot_maf_fn, sep='\t', encoding='iso-8859-1')



Columns (47,48,54,69,88,100,143,147,150,153,154,156,163,164,176,179,181,187,223,229,233,235,236,237,253,262,288,317,320,326,333,344,365,383,390,393,394,397,401,403,404,406,411,413,414,419,429,433,477,484,487,488,491,495,497,498,500,505,507,508,513,523,527) have mixed types. Specify dtype option on import or set low_memory=False.



In [29]:
data_pkl_fn = f'{notebook_data_dir}/review_data.1.pkl'
review_description = 'Test reviewer'

In [37]:
reviewer = MutationReviewer()
reviewer = MutationReviewer()
reviewer.set_review_data(
    data_pkl_fn=data_pkl_fn, 
    description=review_description, 
    mutations_df=mutsig_annot_maf_df,
    bams_df=sample_bams_df.reset_index(),
    mutations_df_sample_col='patient', # on patient level
    chrom_col='chr',
    start_pos_col='pos',
    bam_df_sample_col='participant', # on patient level
    bam_col='gpdw_DNA_WES_icev1_cram_or_bam_path',
    bai_col='gpdw_DNA_WES_icev1_crai_or_bai_path'
)
reviewer.set_review_app(
    mutation_table_display_cols=['Hugo_Symbol', 'chr', 'pos', 'type', 'classification', 'gnomADg_AF', 't_alt_count', 't_ref_count', 'tumor_f', 'purity'],
    bam_table_display_cols=['sample_id', 'participant', 'gpdw_DNA_WES_icev1_cram_or_bam_path', 'gpdw_DNA_WES_icev1_crai_or_bai_path'],
    bai_col='gpdw_DNA_WES_icev1_crai_or_bai_path'
)
reviewer.set_default_review_data_annotations_configuration()


Loading existing data pkl file



In [38]:
reviewer.run(port=8088)

Dash app running on http://0.0.0.0:8088/
socket initialized
Position to view: 1:878,233-878,273
('gs://fc-02e4b730-cb29-48bb-9c3b-562e075457fe/Getz_Ebert_IBM_13-583_Exomes_35samples_Feb2020/RP-1886/Exome/JJ01222018BM/v2/JJ01222018BM.bam',)
socket closed
socket initialized
Position to view: 1:983,385-983,425
('gs://fc-02e4b730-cb29-48bb-9c3b-562e075457fe/Getz_Ebert_IBM_13-583_Exomes_164samples_Sept2019/RP-1886/Exome/PN01232018BM/v2/PN01232018BM.bam', 'gs://fc-02e4b730-cb29-48bb-9c3b-562e075457fe/Getz_Ebert_IBM_13-583_Exomes_35samples_Feb2020/RP-1886/Exome/PQ19066BM-H/v2/PQ19066BM-H.bam')
socket closed
