## Notebook runner for AMP-PD to compare each cohort's per-visit eQTS results via papermill

In [1]:
# print the current system date/time so the saved notebook records when it was run
!date

Mon May 10 21:36:00 UTC 2021


#### import libraries

In [2]:
import pandas as pd
import os
import papermill as pm

In [3]:
# template notebook that papermill executes with injected parameters
base_notebook = '/home/jupyter/notebooks/compare_visit_eqts_results.ipynb'

# fixed settings shared by every run
tissue = 'wb'
quant_type = 'genes'

# values iterated over: one run per cohort, using whichever of these
# visit months have results available
cohorts = ['biofind', 'pdbp', 'ppmi']
months = [0, 1, 6, 12, 18, 24, 36]

#### iterate over the cohorts, running the base notebook once per cohort with the visits that have results

In [4]:
%%time

# Run the comparison notebook once per cohort, restricted to the visit months
# that already have an eQTS results file on disk.
for cohort in cohorts:
    out_nb_dir = f'/home/jupyter/notebooks/{cohort}/pm_gend_nbs'
    # make sure the notebook output dir exists
    os.makedirs(out_nb_dir, exist_ok=True)
    wrk_dir = f'/home/jupyter/{cohort}'
    # before running the comparison notebook, keep only the visits whose
    # results file exists for this cohort
    visits = [month for month in months
              if os.path.isfile(f'{wrk_dir}/eqts/{cohort}.{tissue}{month}.eqts.csv')]
    if len(visits) < 2:
        # a comparison needs more than one visit; report the skip so the saved
        # output shows why this cohort produced no notebook
        print(f'skipping {cohort}: results found for visits {visits}, need at least two')
        continue
    param_dict = {'cohort': cohort, 'tissue': tissue, 'months': visits}
    out_notebook = f'{out_nb_dir}/{cohort}_compare_visit_eqts.ipynb'
    print(param_dict)
    print(out_notebook)
    pm.execute_notebook(input_path=base_notebook, output_path=out_notebook,
                        parameters=param_dict)

{'cohort': 'pdbp', 'tissue': 'wb', 'months': [0, 6, 12, 18, 24]}
/home/jupyter/notebooks/pdbp/pm_gend_nbs/pdbp_compare_visit_eqts.ipynb


Executing:   0%|          | 0/19 [00:00<?, ?cell/s]

{'cohort': 'ppmi', 'tissue': 'wb', 'months': [0, 6, 12, 24, 36]}
/home/jupyter/notebooks/ppmi/pm_gend_nbs/ppmi_compare_visit_eqts.ipynb


Executing:   0%|          | 0/19 [00:00<?, ?cell/s]

CPU times: user 1.14 s, sys: 82.1 ms, total: 1.22 s
Wall time: 6.31 s
