In [1]:
%load_ext autoreload
%autoreload 2
%reload_ext autoreload
from matplotlib_venn import venn2
import pandas as pd

### [PMID_32299494](https://www.ncbi.nlm.nih.gov/pmc/articles/PMC7164172/)

An analysis of genetically regulated gene expression across multiple tissues implicates novel gene candidates in Alzheimer’s disease

In [2]:
# Read Table6.csv for PMID 32299494 from the local resources directory.
PMID_32299494_CMC = pd.read_csv('../../resources/AD-genes/PMID_32299494/Table6.csv')

# `genesd` collects one tidy table per source, keyed by a source label.
# It is (re)initialised here, so this cell must run before the other loaders.
genesd = {}

# Keep only the gene column and tag every row with constant provenance fields.
genesd['PMID_32299494_CMC'] = pd.DataFrame(
    {
        'Gene': PMID_32299494_CMC['Gene'],
        'PMID': 32299494,
        'Method': 'S-PrediXcan',
        'Tissue': 'DLPFC',
    }
)

In [3]:
# Load the 'focus_results' sheet of the supplementary workbook and keep only the
# rows whose 'pip' value is strictly greater than 0.25.
# NOTE(review): 'pip' is presumably FOCUS's posterior inclusion probability and
# 0.25 an analyst-chosen cutoff - confirm against the paper.
PMID_32299494_FOCUS = (
    pd.read_excel(
        '../../resources/AD-genes/PMID_32299494/13195_2020_611_MOESM6_ESM.xlsx',
        sheet_name='focus_results',
    )
    .loc[lambda tbl: tbl['pip'] > 0.25, :]
)

# Gene names come from 'mol_name'; the tissue is taken per row from the sheet,
# while PMID and Method are constant labels.
genesd['PMID_32299494_FOCUS'] = pd.DataFrame(
    {
        'Gene': PMID_32299494_FOCUS['mol_name'],
        'PMID': 32299494,
        'Method': 'FOCUS',
        'Tissue': PMID_32299494_FOCUS['tissue'],
    }
)

### [PMID_33417599](https://www.ncbi.nlm.nih.gov/pmc/articles/PMC7819609/)

Identifying drug targets for neurological and psychiatric disease via genetics and the brain transcriptome

In [4]:
# Load supplementary table s005 for PMID 33417599 and keep only the rows whose
# 'outcome (trait)' column equals 'AD'.
PMID_33417599_MR = (
    pd.read_csv('../../resources/AD-genes/PMID_33417599/journal.pgen.1009224.s005.csv')
    .loc[lambda tbl: tbl['outcome (trait)'].eq('AD')]
)

# Gene names come from 'exposure (gene)'; the remaining columns are constant labels.
genesd['PMID_33417599_MR'] = pd.DataFrame(
    {
        'Gene': PMID_33417599_MR['exposure (gene)'],
        'PMID': 33417599,
        'Method': 'MR',
        'Tissue': 'DLPFC',
    }
)

### [PMID_30617256](https://www.ncbi.nlm.nih.gov/pmc/articles/PMC6836675/)

Genome-wide meta-analysis identifies new loci and functional pathways influencing Alzheimer’s disease risk

In [5]:
# Load sheet 'Table S19' from the supplemental workbook, skipping the first four
# rows of the sheet, then drop every row that has no value in 'Gene'.
PMID_30617256 = (
    pd.read_excel(
        '../../resources/AD-genes/PMID_30617256/NIHMS1031924-supplement-Supplemental_Tables.xlsx',
        sheet_name='Table S19',
        skiprows=4,
    )
    .loc[lambda tbl: tbl.Gene.notna()]
)

# Method and Tissue are both recorded with the literal label 'multiple'.
genesd['PMID_30617256'] = pd.DataFrame(
    {
        'Gene': PMID_30617256['Gene'],
        'PMID': 30617256,
        'Method': 'multiple',
        'Tissue': 'multiple',
    }
)

### [PMID_30820047](https://www.ncbi.nlm.nih.gov/pmc/articles/PMC6463297/)

Genetic meta-analysis of diagnosed Alzheimer’s disease identifies new risk loci and implicates Aβ, tau, immunity and lipid processing

In [6]:
# Load sheet 'Supplementary Table 15' (skipping its first two rows) and keep only
# the rows that have a value in the 'PSMR FDR' column.
PMID_30820047_MR = (
    pd.read_excel(
        '../../resources/AD-genes/PMID_30820047/NIHMS1021255-supplement-S3.xlsx',
        sheet_name='Supplementary Table 15',
        skiprows=2,
    )
    .loc[lambda tbl: tbl['PSMR FDR'].notna()]
)

# Tag the retained genes with constant provenance labels.
genesd['PMID_30820047_MR'] = pd.DataFrame(
    {
        'Gene': PMID_30820047_MR['Gene'],
        'PMID': 30820047,
        'Method': 'SMR-Heidi',
        'Tissue': 'blood',
    }
)

In [11]:
# Sanity check: number of rows contributed by each source table.
{source: len(table) for source, table in genesd.items()}

{'PMID_32299494_CMC': 12,
 'PMID_32299494_FOCUS': 16,
 'PMID_33417599_MR': 15,
 'PMID_30617256': 16,
 'PMID_30820047_MR': 22}

In [12]:
# Stack every per-source gene table into one long table. Each source table keeps
# the row labels of the file it was read from, so concatenating them unchanged can
# leave repeated index values in `genes`; ignore_index=True assigns a fresh
# 0..n-1 index so label-based lookups on the combined table stay unambiguous.
genes = pd.concat(list(genesd.values()), ignore_index=True)

# Number of rows in which each gene symbol appears across all source tables.
genes['Gene'].value_counts()

MS4A6A          5
CR1             4
PTK2B           4
SPI1            3
PVR             3
BIN1            3
CLU             2
CLPTM1          2
HLA-DRB1        2
MS4A2           2
MS4A4A          2
TOMM40          2
HLA-DRA         1
IGSF23          1
EML2            1
MYBPC3          1
EPHA1           1
PVRIG           1
UNC79           1
BCAM            1
TSPAN14         1
AP4M1           1
CCNT2-AS1       1
AC012146.1      1
CEACAM19        1
GRIK4           1
ZNF223          1
APOE            1
AC135050.3      1
X84075          1
TAS2R60         1
ZNF646          1
KAT8            1
HLA-DQA1        1
CCDC6           1
PILRB           1
ZNF221          1
SLC26A9         1
PRSS36          1
APOC1           1
CUGBP1          1
FZD4            1
ZNF284          1
AP2A2           1
IRF2BP1         1
RP5-935K16.1    1
ACE             1
ZNF222          1
REEP6           1
DMWD            1
MAP3K2          1
TRAPC6A         1
SCIMP           1
MS4A3           1
APOC4           1
PVRL2     

In [9]:
# Debug helper: prints the running kernel's connection details (ports, ip, key).
# NOTE(review): this looks like a leftover from interactive debugging - its
# execution count (9) is out of order with the cells above, and the saved output
# includes the kernel's "key" value. Consider removing the cell or clearing its
# output before sharing the notebook.
%connect_info

{
  "shell_port": 55799,
  "iopub_port": 60023,
  "stdin_port": 37489,
  "control_port": 51051,
  "hb_port": 40167,
  "ip": "127.0.0.1",
  "key": "5d7d4bf7-b7cddd8378dc4de9e3e5a56c",
  "transport": "tcp",
  "signature_scheme": "hmac-sha256",
  "kernel_name": ""
}

Paste the above JSON into a file, and connect with:
    $> jupyter <app> --existing <file>
or, if you are local, you can connect with just:
    $> jupyter <app> --existing kernel-b72ebfc8-2d50-4953-a1cb-e29e7083267b.json
or even just:
    $> jupyter <app> --existing
if this is the most recent Jupyter kernel you have started.
