## Runner notebook for AMP-PD: scan replicated ieQTL results for risk variants, per interaction term, via papermill

In [1]:
# shell escape: print the current date/time so the run is timestamped in the output
!date

Tue Jul  6 19:43:17 UTC 2021


#### import libraries

In [2]:
import pandas as pd
import os
import papermill as pm

In [3]:
# template notebook that the loop below executes once per interaction term
base_notebook = '/home/jupyter/notebooks/replicated_ieqtl_scan_risk.ipynb'

# fixed members of every iteration tuple; these are forwarded unchanged
# to the template notebook as parameters
disc_cohort, rep_cohort, tissue = 'ppmi', 'pdbp', 'wb'

# varying member of the iteration tuple: one run is attempted per term
terms = [
    'DX',
    'GRS',
    'Basophils',
    'Eosinophils',
    'Lymphocytes',
    'Monocytes',
    'Neutrophils',
]

#### iterate over the tuples running the notebook per tuple

In [4]:
%%time

# Run the base notebook once per interaction term via papermill.
# Each run writes its own executed copy of the notebook into out_nb_dir.
# A failure in one term is reported and does not stop the remaining terms.
out_nb_dir = f'/home/jupyter/notebooks/{disc_cohort}/pm_gend_nbs'
# make sure the notebook output dir exists
os.makedirs(out_nb_dir, exist_ok=True)
wrk_dir = f'/home/jupyter/{disc_cohort}'
for term in terms:
    # only run the notebook when the ieQTL results file for this
    # cohort, tissue and interaction term is present
    results_file = f'{wrk_dir}/results/{disc_cohort}.{tissue}.{term}.cis.ieqtl.csv'
    if not os.path.isfile(results_file):
        # report the skip so a missing input is not mistaken for a completed run
        print(f'{disc_cohort}.{tissue}.{term} results file not found, skipping: {results_file}')
        continue

    param_dict = {'disc_cohort': disc_cohort, 'rep_cohort': rep_cohort,
                  'tissue': tissue, 'interaction_term': term}
    out_notebook = f'{out_nb_dir}/{disc_cohort}.{tissue}.{term}.replicated_ieqtl_scan_risk.ipynb'
    print(param_dict)
    print(out_notebook)
    try:
        pm.execute_notebook(input_path=base_notebook, output_path=out_notebook,
                            parameters=param_dict)
    except Exception as err:
        # Catch Exception rather than using a bare except so that
        # KeyboardInterrupt/SystemExit still stop the whole run, and
        # print the cause so the failure can be diagnosed afterwards.
        print(f'{disc_cohort}.{tissue}.{term} encountered an error continuing on next')
        print(f'    {type(err).__name__}: {err}')

{'disc_cohort': 'ppmi', 'rep_cohort': 'pdbp', 'tissue': 'wb', 'interaction_term': 'DX'}
/home/jupyter/notebooks/ppmi/pm_gend_nbs/ppmi.wb.DX.replicated_ieqtl_scan_risk.ipynb


Executing:   0%|          | 0/51 [00:00<?, ?cell/s]

ppmi.wb.DX encountered an error continuing on next
{'disc_cohort': 'ppmi', 'rep_cohort': 'pdbp', 'tissue': 'wb', 'interaction_term': 'GRS'}
/home/jupyter/notebooks/ppmi/pm_gend_nbs/ppmi.wb.GRS.replicated_ieqtl_scan_risk.ipynb


Executing:   0%|          | 0/51 [00:00<?, ?cell/s]

{'disc_cohort': 'ppmi', 'rep_cohort': 'pdbp', 'tissue': 'wb', 'interaction_term': 'Basophils'}
/home/jupyter/notebooks/ppmi/pm_gend_nbs/ppmi.wb.Basophils.replicated_ieqtl_scan_risk.ipynb


Executing:   0%|          | 0/51 [00:00<?, ?cell/s]

{'disc_cohort': 'ppmi', 'rep_cohort': 'pdbp', 'tissue': 'wb', 'interaction_term': 'Eosinophils'}
/home/jupyter/notebooks/ppmi/pm_gend_nbs/ppmi.wb.Eosinophils.replicated_ieqtl_scan_risk.ipynb


Executing:   0%|          | 0/51 [00:00<?, ?cell/s]

{'disc_cohort': 'ppmi', 'rep_cohort': 'pdbp', 'tissue': 'wb', 'interaction_term': 'Lymphocytes'}
/home/jupyter/notebooks/ppmi/pm_gend_nbs/ppmi.wb.Lymphocytes.replicated_ieqtl_scan_risk.ipynb


Executing:   0%|          | 0/51 [00:00<?, ?cell/s]

{'disc_cohort': 'ppmi', 'rep_cohort': 'pdbp', 'tissue': 'wb', 'interaction_term': 'Monocytes'}
/home/jupyter/notebooks/ppmi/pm_gend_nbs/ppmi.wb.Monocytes.replicated_ieqtl_scan_risk.ipynb


Executing:   0%|          | 0/51 [00:00<?, ?cell/s]

{'disc_cohort': 'ppmi', 'rep_cohort': 'pdbp', 'tissue': 'wb', 'interaction_term': 'Neutrophils'}
/home/jupyter/notebooks/ppmi/pm_gend_nbs/ppmi.wb.Neutrophils.replicated_ieqtl_scan_risk.ipynb


Executing:   0%|          | 0/51 [00:00<?, ?cell/s]

CPU times: user 31.4 s, sys: 1.16 s, total: 32.6 s
Wall time: 1h 7min 11s
