# Brain Commons - Parkinson's Progression Markers Initiative (MJFF-PPMI)

Import the library that provides the pipeline functions and GraphQL queries, and load our credentials:

In [None]:
%matplotlib inline
import bhc_analysis_functions as bc
# Hand the local credentials file to the library.
# NOTE(review): presumably this authenticates the queries issued by later cells — confirm in bhc_analysis_functions.
bc.add_keys('credentials.json')

## 1. HIGH-LEVEL PYTHON LIBRARY BASED ON GRAPHQL QUERIES

### Get summary counts for each data type in the projects:

In [None]:
# Summary counts for the two MJFF projects (LRRK2 and PPMI).
bc.query_summary_counts(["mjff-LRRK2", "mjff-PPMI"])

### Get counts per field:

In [None]:
# Any field in the model can be summarized.
# NOTE(review): the arguments look like (field name, data type that holds the field) — confirm
# against bhc_analysis_functions.query_summary_field.
disease_counts = bc.query_summary_field('primary_diagnosis', 'diagnosis')
race_counts = bc.query_summary_field('race', 'demographic')

## 2. PPMI DATA ANALYSIS AND SUMMARY STATISTICS

In [None]:
# Project analyzed in this section; the cells below pass it to the bc helpers.
project_id = "mjff-PPMI"

### Summary statistics for demographic continuous variables

In [None]:
# Aggregated statistics for the "Age" and "Education" demographic variables.
# Uses the shared project_id (assigned earlier in this section) instead of repeating
# the "mjff-PPMI" literal, so switching projects only requires one change.
bc.get_aggregated_statistics(project_id, "demographic", ["Age", "Education"])

### Summary statistics for demographic categorical variables

#### Summary statistics for gender

In [None]:
# Frequency table of "gender" within the "demographic" data for project_id.
bc.get_frequency_table(project_id, "demographic", "gender")

#### Summary statistics for race

In [None]:
# Frequency table of "race" within the "demographic" data for project_id.
bc.get_frequency_table(project_id, "demographic", "race")

### Summary statistics for assessment total scores

In [None]:
# Summary statistics of the assessment total scores for project_id.
bc.get_assessment_statistics(project_id)

### Summary statistics for clinical test/exam variables

#### DaTscan image exams (Specific Binding Ratio - SBR)

In [None]:
# SBR fields of the "image_exam" data to aggregate for project_id.
# NOTE(review): "stratium" looks like a misspelling of "striatum". The name is kept
# as-is because it must match the field name in the data model — confirm against the
# data dictionary before renaming.
datscan_variables = [
    "mean_putamen_sbr",
    "mean_caudate_sbr",
    "mean_stratium_sbr",
]
bc.get_aggregated_statistics(project_id, "image_exam", datscan_variables)

#### Laboratory results from Cerebrospinal fluid (CSF)

In [None]:
# CSF fields of the "lab_result" data to aggregate for project_id.
lab_variables = [
    "csf_abeta",
    "csf_asyn",
    "csf_tau",
    "csf_ptau",
]
bc.get_aggregated_statistics(project_id, "lab_result", lab_variables)

#### Questionnaire scores (longitudinal variables)

In [None]:
# Follow-up summary of the "REM Sleep Disorder" score from the
# "non_motor_assessment" data for project_id.
bc.get_followup_summary(project_id, "non_motor_assessment", "REM Sleep Disorder")

#### MRI Volume comparison (Wilcoxon non-parametric test)

Compare MRI volume measures (banks of the superior temporal sulcus, caudal anterior cingulate, and caudal middle frontal) for the PPMI cohort by genotype.

A **Wilcoxon rank-sum test (p-value < 0.05)** is applied to determine statistically significant differences against a baseline genotype passed as a parameter:

In [None]:
# Arguments shared by the three comparisons: the genotype field and the baseline
# genotype that the other genotypes are compared against.
genotype_field = 'apoe_genotype'
baseline_genotype = 'e2/e2'

# One call per MRI volume measure, in the same order as before.
data_bank = bc.get_mri_subfield_by_genotype(
    project_id, genotype_field, 'Banks Superior Temporal Sulcus Volume', baseline_genotype
)
data_cauant = bc.get_mri_subfield_by_genotype(
    project_id, genotype_field, 'Caudal Anterior Cingulate Volume', baseline_genotype
)
data_caumid = bc.get_mri_subfield_by_genotype(
    project_id, genotype_field, 'Caudal Middle Frontal Volume', baseline_genotype
)

### Summary statistics across projects

In [None]:
# Projects included in the cross-project summaries below.
projects = ["mjff-PPMI", "mjff-LRRK2"]

#### Age at diagnosis

In [None]:
# Summary statistics of "Diagnosis Age" from the "diagnosis" data, across all entries in projects.
bc.get_summary_statistics(projects, "diagnosis", "Diagnosis Age")

#### LED in PD Subjects

In [None]:
# Summary statistics of "LED" from the "medication" data, across all entries in projects.
# NOTE(review): the trailing "PD" argument presumably restricts the summary to PD
# subjects, as the heading of this cell suggests — confirm in bhc_analysis_functions.
bc.get_summary_statistics(projects, "medication", "LED", "PD")