# Create Heatmap 

This notebook looks at genes that are significant in at least one cancer. Pan-cancer heatmaps are created, with circle size showing significance and color showing the difference in medians.

In [1]:
import pandas as pd
import numpy as np
import seaborn as sns
import matplotlib.pyplot as plt
import scipy.stats
import gseapy as gp
import re
import sys 

import cptac
import cptac.utils as u
import plot_utils as p

# Run GSEA

In [3]:
# Load the CSV that feeds the heatmap. Forward slashes are used so the relative
# path resolves on every OS and the literal contains no invalid backslash
# escapes (the previous '\c' and '\s' trigger warnings on modern Python).
sig_df = pd.read_csv('Make_Tables/csv/sig_pval_heatmap.csv')
# Number of distinct entries in the Proteomics column.
print('sig in one cancer:', len(sig_df.Proteomics.unique()))
# NOTE(review): this line prints a hard-coded literal; it is not computed from sig_df.
print('sig in mult cancers: 0')

sig in one cancer: 29
sig in mult cancers: 0


In [58]:
# Send every distinct entry of the Proteomics column to gseapy's enrichr,
# using the Reactome_2016 gene-set library.
# NOTE(review): outdir='/Enrichr' is an absolute path at the filesystem root —
# confirm that this is the intended output location.
prot_list = list(sig_df.Proteomics.unique())
prot_enr = gp.enrichr(
    gene_list=prot_list,
    description='Tumor_partition',
    gene_sets='Reactome_2016',
    outdir='/Enrichr',
)



In [59]:
# Preview the first rows of the enrichment results table held in res2d.
prot_enr.res2d.head()

Unnamed: 0,Term,Overlap,P-value,Adjusted P-value,Old P-value,Old Adjusted P-value,Odds Ratio,Combined Score,Genes,Gene_set
0,Extrinsic Pathway of Fibrin Clot Formation Hom...,1/5,0.00723,1.0,0,0,137.931034,679.940112,F3,Reactome_2016
1,Urea cycle Homo sapiens R-HSA-70635,1/10,0.014409,1.0,0,0,68.965517,292.407787,CPS1,Reactome_2016
2,Rap1 signalling Homo sapiens R-HSA-392517,1/16,0.022958,1.0,0,0,43.103448,162.676706,RAP1GAP2,Reactome_2016
3,TNF receptor superfamily (TNFSF) members media...,1/17,0.024376,1.0,0,0,40.567951,150.676386,TNFRSF12A,Reactome_2016
4,Regulation of Insulin-like Growth Factor (IGF)...,1/21,0.030027,1.0,0,0,32.840722,115.128225,MMP1,Reactome_2016


# Make Heatmap

In [21]:
# Keep only the rows whose P_Value is strictly below 0.05.
sig_df = sig_df[sig_df['P_Value'].lt(0.05)]

In [34]:
# Circle heatmap of the filtered table: P_Value drives the circle variable and
# Medians the color variable, with Proteomics on the x-axis and Cancer on the
# y-axis. save_png names the image file (presumably written by plot_utils).
p.plotCircleHeatMap(
    sig_df,
    circle_var='P_Value',
    color_var='Medians',
    x_axis='Proteomics',
    y_axis='Cancer',
    plot_height=400,
    plot_width=800,
    legend_min=0.01,
    legend_max=0.05,
    save_png='KRAS_2.png',
)

# G12

In [51]:
# Hand-entered gene symbols for the G12 enrichment query.
# The stray leading space in ' GPRC5A' was removed: a symbol with surrounding
# whitespace may fail to match the entries of the gene-set library.
g12 = ['GPRC5A', 'BCAT2', 'ETFB', 'ETFA']
# Distinct Proteomics entries of sig_df; kept for later cells, but NOT used by
# the G12 query below (which is driven by `g12`).
prot_list = list(sig_df.Proteomics.unique())
# NOTE(review): outdir='/Enrichr' is an absolute path at the filesystem root —
# confirm that this is the intended output location.
prot_enr = gp.enrichr(gene_list=g12, description='Tumor_partition', gene_sets='Reactome_2016',
                      outdir='/Enrichr')



In [52]:
# Preview the first rows of the G12 enrichment results table held in res2d.
prot_enr.res2d.head()

Unnamed: 0,Term,Overlap,P-value,Adjusted P-value,Old P-value,Old Adjusted P-value,Odds Ratio,Combined Score,Genes,Gene_set
0,Respiratory electron transport Homo sapiens R-...,2/88,0.000114,0.174701,0,0,113.636364,1031.556981,ETFA;ETFB,Reactome_2016
1,"Respiratory electron transport, ATP synthesis ...",2/109,0.000175,0.134124,0,0,91.743119,793.474108,ETFA;ETFB,Reactome_2016
2,The citric acid (TCA) cycle and respiratory el...,2/153,0.000345,0.176126,0,0,65.359477,520.978293,ETFA;ETFB,Reactome_2016
3,Metabolism Homo sapiens R-HSA-1430728,3/1908,0.00322,1.0,0,0,7.861635,45.112456,ETFA;ETFB;BCAT2,Reactome_2016
4,Branched-chain amino acid catabolism Homo sapi...,1/23,0.004592,1.0,0,0,217.391304,1170.296343,BCAT2,Reactome_2016


In [47]:
# Load the G12 CSV that feeds the G12 heatmap. Forward slashes are used so the
# relative path resolves on every OS and the literal contains no invalid
# backslash escapes (the previous '\c' and '\s' trigger warnings on modern Python).
g12_sig_df = pd.read_csv('Make_Tables/csv/sig_pval_heatmap_G12.csv')
# Number of distinct entries in the Proteomics column.
print('sig in one cancer:', len(g12_sig_df.Proteomics.unique()))
# NOTE(review): this line prints a hard-coded literal; it is not computed from g12_sig_df.
print('sig in mult cancers: 0')

sig in one cancer: 4
sig in mult cancers: 0


In [48]:
# Keep only the G12 rows whose P_Value is strictly below 0.05.
g12_sig_df = g12_sig_df[g12_sig_df['P_Value'].lt(0.05)]

In [50]:
# Circle heatmap of the filtered G12 table: P_Value drives the circle variable
# and Medians the color variable, with Proteomics on the x-axis and Cancer on
# the y-axis. save_png names the image file (presumably written by plot_utils).
p.plotCircleHeatMap(
    g12_sig_df,
    circle_var='P_Value',
    color_var='Medians',
    x_axis='Proteomics',
    y_axis='Cancer',
    plot_height=400,
    plot_width=400,
    legend_min=0.01,
    legend_max=0.05,
    save_png='KRAS_G12.png',
)